Describe the problem: LinkedIn doesn't allow recruiters to download all candidates in Excel format. Sigh.
Anyway, the following sitemap goes through all the pages but doesn't produce any scraped data.
I tried the sitemap without the pagination selector and it scrapes the candidate data, and I tried the pagination selector without the candidate selectors and it traverses all the pages. But when the two are combined, nothing is scraped.
As you can see, I have tried long delay times (for example, a delay of 7000 on the pagination selector), but that did not help.
Url: https://www.linkedin.com/talent/hire/173816335/manage/all
Sitemap:
{
  "_id": "linkedin",
  "startUrl": [
    "https://www.linkedin.com/talent/hire/173816335/manage/all"
  ],
  "selectors": [
    {
      "id": "candidate",
      "type": "SelectorElementScroll",
      "parentSelectors": [
        "_root",
        "pagination"
      ],
      "selector": "article.profile-list-item",
      "multiple": true,
      "delay": 50
    },
    {
      "id": "Name",
      "type": "SelectorText",
      "parentSelectors": [
        "candidate"
      ],
      "selector": ".artdeco-entity-lockup__title a",
      "multiple": false,
      "regex": "",
      "delay": 0
    },
    {
      "id": "Subtitle",
      "type": "SelectorText",
      "parentSelectors": [
        "candidate"
      ],
      "selector": ".artdeco-entity-lockup__subtitle span",
      "multiple": false,
      "regex": "",
      "delay": 0
    },
    {
      "id": "Location",
      "type": "SelectorText",
      "parentSelectors": [
        "candidate"
      ],
      "selector": ".artdeco-entity-lockup__metadata div",
      "multiple": false,
      "regex": "",
      "delay": 0
    },
    {
      "id": "Industry",
      "type": "SelectorText",
      "parentSelectors": [
        "candidate"
      ],
      "selector": "span[data-test-current-employer-industry]",
      "multiple": false,
      "regex": "",
      "delay": 0
    },
    {
      "id": "pagination",
      "type": "SelectorElementClick",
      "parentSelectors": [
        "_root"
      ],
      "selector": "ol.profile-list",
      "multiple": false,
      "delay": 7000,
      "clickElementSelector": ".mini-pagination__quick-link [type='chevron-right-icon']",
      "clickType": "clickMore",
      "discardInitialElements": "do-not-discard",
      "clickElementUniquenessType": "uniqueText"
    }
  ]
}