mirror of
https://github.com/orangecoding/fredy.git
synced 2026-06-16 12:31:07 +00:00
51 lines
1.5 KiB
JavaScript
Executable File
51 lines
1.5 KiB
JavaScript
Executable File
const utils = require('../utils');
|
|
|
|
let appliedBlackList = [];
|
|
|
|
function normalize(o) {
|
|
let size = `${o.size.replace(' Wohnfläche ', '').trim()}`;
|
|
if (o.rooms != null) {
|
|
size += ` / / ${o.rooms.trim()}`;
|
|
}
|
|
const link = `https://www.1a-immobilienmarkt.de/expose/${o.id}.html`;
|
|
|
|
return Object.assign(o, { size, link });
|
|
}
|
|
|
|
function applyBlacklist(o) {
|
|
const titleNotBlacklisted = !utils.isOneOf(o.title, appliedBlackList);
|
|
const descNotBlacklisted = !utils.isOneOf(o.description, appliedBlackList);
|
|
|
|
return titleNotBlacklisted && descNotBlacklisted;
|
|
}
|
|
|
|
const config = {
|
|
url: null,
|
|
crawlContainer: '.tabelle',
|
|
sortByDateParam: 'sort_type=newest',
|
|
crawlFields: {
|
|
id: '.inner_object_data input[name="marker_objekt_id"]@value | int',
|
|
price: '.tabelle .inner_object_data .single_data_price | removeNewline | trim',
|
|
size: '.tabelle .inner_object_data .data_boxes div:nth-child(1)',
|
|
rooms: '.tabelle .inner_object_data .data_boxes div:nth-child(2)',
|
|
title: '.tabelle .inner_object_data .tabelle_inhalt_titel_black | removeNewline | trim',
|
|
description: '.tabelle .inner_object_data .objekt_beschreibung | removeNewline | trim',
|
|
},
|
|
normalize: normalize,
|
|
filter: applyBlacklist,
|
|
};
|
|
|
|
exports.init = (sourceConfig, blacklist) => {
|
|
config.enabled = sourceConfig.enabled;
|
|
config.url = sourceConfig.url;
|
|
appliedBlackList = blacklist || [];
|
|
};
|
|
|
|
exports.metaInformation = {
|
|
name: '1a Immobilien',
|
|
baseUrl: 'https://www.1a-immobilienmarkt.de/',
|
|
id: __filename.slice(__dirname.length + 1, -3),
|
|
};
|
|
|
|
exports.config = config;
|