mirror of
https://github.com/orangecoding/fredy.git
synced 2026-06-16 12:31:07 +00:00
48 lines
1.6 KiB
JavaScript
Executable File
48 lines
1.6 KiB
JavaScript
Executable File
import utils from '../utils.js';
|
|
|
|
let appliedBlackList = [];
|
|
|
|
function normalize(o) {
|
|
const id = o.id.substring(o.id.indexOf('-') + 1, o.id.length);
|
|
const size = o.size || 'N/A m²';
|
|
const price = (o.price || '--- €').replace('Preis auf Anfrage', '--- €');
|
|
const title = o.title || 'No title available';
|
|
const link = `https://immo.swp.de/immobilien/${id}`;
|
|
const description = o.description;
|
|
return Object.assign(o, {id, price, size, title, link, description});
|
|
}
|
|
|
|
function applyBlacklist(o) {
|
|
const titleNotBlacklisted = !utils.isOneOf(o.title, appliedBlackList);
|
|
const descNotBlacklisted = !utils.isOneOf(o.description, appliedBlackList);
|
|
return titleNotBlacklisted && descNotBlacklisted;
|
|
}
|
|
|
|
const config = {
|
|
url: null,
|
|
crawlContainer: '.js-serp-item',
|
|
sortByDateParam: 's=most_recently_updated_first',
|
|
crawlFields: {
|
|
id: '.js-bookmark-btn@data-id',
|
|
price: 'div.align-items-start div:first-child | trim',
|
|
size: 'div.align-items-start div:nth-child(3) | trim',
|
|
title: '.card-title h2 | trim',
|
|
link: '.ci-search-result__link@href',
|
|
description: '.js-show-more-item-sm | removeNewline | trim',
|
|
},
|
|
paginate: 'li.page-item.pagination__item a.page-link@href',
|
|
normalize: normalize,
|
|
filter: applyBlacklist,
|
|
};
|
|
export const init = (sourceConfig, blacklist) => {
|
|
config.enabled = sourceConfig.enabled;
|
|
config.url = sourceConfig.url;
|
|
appliedBlackList = blacklist || [];
|
|
};
|
|
export const metaInformation = {
|
|
name: 'Immo Südwest Presse',
|
|
baseUrl: 'https://immo.swp.de/',
|
|
id: 'immoswp',
|
|
};
|
|
export {config};
|