Good afternoon,
I need to scrape quite a lot of information from a web page for my master's degree final project and I am unable to make it work. It doesn't scrape the simplest things and I'm starting to suspect that it's a problem with the interaction between the page and the application.
I hope someone can help me because it is important to me. I would be very grateful.
The sitemap has to use pagination and multiple levels of nested selectors. It still looks simple to me, but something is going wrong.
URL: European leagues & cups | Transfermarkt (https://www.transfermarkt.com/wettbewerbe/europa/wettbewerbe)
Sitemap:
{"_id":"ligas","startUrl":["https://www.transfermarkt.com/wettbewerbe/europa/wettbewerbe"],"selectors":[{"delay":0,"id":"leagues","multiple":true,"parentSelectors":["_root","Pagination"],"selector":".inline-table a[title]","type":"SelectorLink"},{"delay":0,"id":"teams","multiple":true,"parentSelectors":["leagues"],"selector":"#yw1 .hauptlink a[title]","type":"SelectorLink"},{"delay":0,"id":"players","multiple":true,"parentSelectors":["teams"],"selector":".di .hide-for-small a","type":"SelectorLink"},{"delay":0,"id":"face","multiple":false,"parentSelectors":["players"],"selector":"img.data-header__profile-image","type":"SelectorImage"},{"delay":0,"id":"birth","multiple":false,"parentSelectors":["players"],"regex":"","selector":"span[itemprop='birthDate']","type":"SelectorText"},{"delay":0,"id":"team","multiple":false,"parentSelectors":["players"],"regex":"","selector":"[itemprop='affiliation'] a","type":"SelectorText"},{"delay":0,"id":"joined","multiple":false,"parentSelectors":["players"],"regex":"","selector":"span:nth-of-type(4) span","type":"SelectorText"},{"delay":0,"id":"marketValue","multiple":false,"parentSelectors":["players"],"regex":"","selector":"div.tm-player-market-value-development__current-value","type":"SelectorText"},{"delay":0,"id":"injuries","multiple":false,"parentSelectors":["players"],"selector":"div:nth-of-type(4) li:nth-of-type(1) a","type":"SelectorLink"},{"columns":[{"extract":true,"header":"Season","name":"Season"},{"extract":true,"header":"Injury","name":"Injury"},{"extract":true,"header":"from","name":"from"},{"extract":true,"header":"until","name":"until"},{"extract":true,"header":"Days","name":"Days"},{"extract":true,"header":"Games missed","name":"Games missed"}],"delay":0,"id":"injuriesTable","multiple":true,"parentSelectors":["injuries"],"selector":"table","tableDataRowSelector":"tbody tr","tableHeaderRowSelector":"thead tr","type":"SelectorTable"},{"delay":0,"id":"Pagination","multiple":true,"parentSelectors":["_root","Pagination"],"selector":"a.tm-pagination__link","type":"SelectorLink"}]}
