2019-03-15 19:59:05 -04:00
|
|
|
// Open The Verge's tech listing page and bind it to `doc`, using the "cdp" driver.
// The `ignore.resources` option carries a single rule with url "*" and type "image".
// NOTE(review): presumably this makes the driver skip loading every image resource
// to speed up page loads - confirm against the Ferret DOCUMENT options reference.
LET doc = DOCUMENT('https://www.theverge.com/tech', {
|
2021-09-02 11:09:48 -04:00
|
|
|
driver: "cdp",
|
|
|
|
ignore: {
|
|
|
|
resources: [
|
|
|
|
{
|
|
|
|
url: "*",
|
|
|
|
type: "image"
|
|
|
|
}
|
|
|
|
]
|
|
|
|
}
|
2019-03-15 19:59:05 -04:00
|
|
|
})
|
2021-09-02 11:09:48 -04:00
|
|
|
|
2018-10-05 23:36:23 -04:00
|
|
|
// Block until an element matching '.c-compact-river__entry' is present in `doc`.
// The third argument (5000) is the wait limit - presumably milliseconds; TODO confirm.
WAIT_ELEMENT(doc, '.c-compact-river__entry', 5000)
|
|
|
|
// Collect every element in `doc` matching '.c-entry-box--compact__image-wrapper'.
// The subquery that builds `links` reads each element's `attributes.href`.
LET articles = ELEMENTS(doc, '.c-entry-box--compact__image-wrapper')
|
|
|
|
// Build `links`: the href of each collected article element, keeping only hrefs
// that match the pattern 'https://www.theverge.com/*'.
// The filter reads `attributes?.href` (optional access) while the RETURN reads
// `attributes.href` directly.
// NOTE(review): presumably safe because an element with no href cannot pass the
// LIKE filter - confirm how LIKE treats a missing value.
LET links = (
|
|
|
|
FOR article IN articles
|
2021-09-02 11:09:48 -04:00
|
|
|
FILTER article.attributes?.href LIKE 'https://www.theverge.com/*'
|
2018-10-05 23:36:23 -04:00
|
|
|
RETURN article.attributes.href
|
|
|
|
)
|
2021-09-02 11:09:48 -04:00
|
|
|
|
2018-10-05 23:36:23 -04:00
|
|
|
// Main query: for each collected link, navigate the same `doc` to that link,
// wait for the article body, and return its text. The statement order matters:
// navigate, then wait, then read the element.
FOR link IN links
|
2018-10-07 20:15:41 -04:00
|
|
|
// The Verge has pretty heavy pages, so let's increase the navigation wait time
|
2018-10-07 21:23:36 -04:00
|
|
|
NAVIGATE(doc, link, 20000)
|
2021-09-02 11:09:48 -04:00
|
|
|
// Wait for the '.c-entry-content' element on the newly loaded page before reading it.
// The limit here is 15000 - presumably milliseconds; TODO confirm.
WAIT_ELEMENT(doc, '.c-entry-content', 15000)
|
2018-10-05 23:36:23 -04:00
|
|
|
LET texter = ELEMENT(doc, '.c-entry-content')
|
|
|
|
// One result per link: the innerText of that page's '.c-entry-content' element.
RETURN texter.innerText
|