Hi. I'm trying to scrape the questions and comments posted on the Philippines page of the TripAdvisor forum, but I want to limit the scrape to the first 50 pages. I tried using the ":not" CSS selector and the range URL method, as suggested on this page, but I can't make either of them work.
URL: https://www.tripadvisor.com/ShowForum-g294245-i3256-Philippines.html
Here's my current sitemap:
{"_id":"tripadvisor-ph","startUrl":["https://www.tripadvisor.com/ShowForum-g294245-i3256-Philippines.html"],"selectors":[{"id":"questions","type":"SelectorLink","parentSelectors":["Main Page"],"selector":"tr:nth-of-type(n+7) b a","multiple":true,"delay":0},{"id":"question title","type":"SelectorText","parentSelectors":["questions"],"selector":".bx01 div.postTitle","multiple":false,"regex":"","delay":0},{"id":"question date","type":"SelectorText","parentSelectors":["questions"],"selector":".bx01 div.postDate","multiple":false,"regex":"","delay":0},{"id":"questioner name","type":"SelectorText","parentSelectors":["questions"],"selector":".bx01 div.username","multiple":false,"regex":"","delay":0},{"id":"question body","type":"SelectorText","parentSelectors":["questions"],"selector":".bx01 div.postBody","multiple":false,"regex":"","delay":0},{"id":"questioner location","type":"SelectorText","parentSelectors":["questions"],"selector":".profile div.location","multiple":false,"regex":"","delay":0},{"id":"Main Page","type":"SelectorElementClick","parentSelectors":["_root"],"selector":"div.balance","multiple":true,"delay":"5000","clickElementSelector":"div.deckTools:nth-of-type(6) a:nth-of-type:not[(100)]","clickType":"clickOnce","discardInitialElements":"do-not-discard","clickElementUniquenessType":"uniqueText"}]}
I would appreciate all your help.
Thanks in advance!