mirror of
https://github.com/orangecoding/fredy.git
synced 2026-06-16 12:31:07 +00:00
fixing immowelt crawler
This commit is contained in:
@@ -3,7 +3,7 @@ const config = require('../../conf/config.json');
|
||||
const utils = require('../utils');
|
||||
|
||||
function normalize(o) {
|
||||
const size = o.size.split('Wohnfläche')[0];
|
||||
const size = o.size.split('Wohnfläche')[1].replace(' (ca.) ', '');
|
||||
const address = o.address;
|
||||
|
||||
return Object.assign(o, { size, address });
|
||||
@@ -24,11 +24,10 @@ const immowelt = {
|
||||
crawlFields: {
|
||||
id: '@data-estateid | int',
|
||||
price: '.hardfacts_3 strong | removeNewline | trim',
|
||||
size: '.hardfacts_3 div:nth-child(2):not(.hardfactlabel)| removeNewline | trim',
|
||||
size: '.js-object.listitem_wrap .hardfacts_3 div:nth-child(2)| removeNewline | trim',
|
||||
title: '.listcontent.clear h2',
|
||||
link: 'a@href',
|
||||
description: '.listconten_offset .listmerkmale| removeNewline | trim',
|
||||
address: '.listconten_offset .listlocation| removeNewline | trim'
|
||||
address: '.listcontent .details .listlocation| removeNewline | trim'
|
||||
},
|
||||
paginate: '#pnlPaging #nlbPlus@href',
|
||||
normalize: normalize,
|
||||
|
||||
Reference in New Issue
Block a user