Hello All,
I want to scrape data from a website that lists all rental adverts in a city.
There are 79 adverts to be scraped, spread across 4 pages.
My sitemap (below) is properly set up; however, it does not scrape all 79 ads. The number varies randomly from run to run: first 71 ads, then 68 ads, and finally 73 ads.
I tried adding a page load delay, but the result is the same.
Does anyone have an idea of what could help, please?
Sitemap:
{"_id":"seloger_roanne2","startUrl":["https://www.seloger.com/list.htm?projects=1&types=1&places=[{ci%3A420187}]&price=NaN%2F450&surface=NaN%2F60&bedrooms=1%2C2&rooms=2%2C3&enterprise=0&qsVersion=1.0&LISTING-LISTpg=[1-8]"],"selectors":[{"id":"details","type":"SelectorLink","parentSelectors":["_root"],"selector":".Card__ContentZone-sc-7insep-3 a.CoveringLink-a3s3kt-0","multiple":true,"delay":0},{"id":"piece","type":"SelectorText","parentSelectors":["details"],"selector":"div.TagsWithIcon__TagContainer-j1x9om-1:nth-of-type(1) div:nth-of-type(2)","multiple":false,"regex":"","delay":0},{"id":"chambre","type":"SelectorText","parentSelectors":["details"],"selector":"div.TagsWithIcon__TagContainer-j1x9om-1:nth-of-type(2) div:nth-of-type(2)","multiple":false,"regex":"","delay":0},{"id":"surface","type":"SelectorText","parentSelectors":["details"],"selector":"div.TagsWithIcon__TagContainer-j1x9om-1:nth-of-type(3) div:nth-of-type(2)","multiple":false,"regex":"","delay":0},{"id":"prix","type":"SelectorText","parentSelectors":["details"],"selector":".Summarystyled__PriceText-tzuaot-10 span.global-styles__TextNoWrap-sc-1aeotog-6","multiple":false,"regex":"","delay":0},{"id":"descriptif","type":"SelectorText","parentSelectors":["details"],"selector":".ShowMoreText__UITextContainer-sc-5ggbbc-0 p","multiple":false,"regex":"","delay":0},{"id":"agence","type":"SelectorText","parentSelectors":["details"],"selector":"h3.LightSummary__Title-f6k8ax-1","multiple":false,"regex":"","delay":0},{"id":"ref","type":"SelectorText","parentSelectors":["details"],"selector":"div.SubHeaderstyled__Reference-sc-1s8qndx-7","multiple":false,"regex":"","delay":0},{"id":"plus1","type":"SelectorText","parentSelectors":["details"],"selector":"figure:nth-of-type(1) figcaption","multiple":false,"regex":"","delay":0},{"id":"plus2","type":"SelectorText","parentSelectors":["details"],"selector":"figure:nth-of-type(2) figcaption","multiple":false,"regex":"","delay":0},{"id":"plus3","type":"SelectorText","parentSelectors":["details"],"selector":"figure:nth-of-type(3) figcaption","multiple":false,"regex":"","delay":0},{"id":"perf_energ","type":"SelectorText","parentSelectors":["details"],"selector":".hJiFNB span.Preview__PreviewTooltipValue-sc-1pa12ii-4","multiple":false,"regex":"","delay":0},{"id":"gaz","type":"SelectorText","parentSelectors":["details"],"selector":".jsgeee span.Preview__PreviewTooltipValue-sc-1pa12ii-4","multiple":false,"regex":"","delay":0},{"id":"quartier","type":"SelectorText","parentSelectors":["details"],"selector":"span.Summarystyled__FakeLink-tzuaot-14","multiple":false,"regex":"","delay":0}]}