2020-06-17 17:37:01 -04:00
|
|
|
LET baseURL = 'https://www.amazon.com/'
|
|
|
|
LET amazon = DOCUMENT(baseURL, { driver: "cdp" })
|
2018-11-12 19:58:12 -05:00
|
|
|
|
|
|
|
INPUT(amazon, '#twotabsearchtextbox', @criteria)
|
2021-09-02 11:09:48 -04:00
|
|
|
CLICK(amazon, '#nav-search-submit-button')
|
2021-11-22 14:36:28 -05:00
|
|
|
|
|
|
|
WAITFOR EVENT "navigation" IN amazon
|
|
|
|
FILTER current.url =~ "www\.amazon\.com\/s\?k="
|
|
|
|
TIMEOUT 50000
|
2018-11-12 19:58:12 -05:00
|
|
|
|
2021-09-02 11:09:48 -04:00
|
|
|
LET resultListSelector = '[data-component-type="s-search-results"]'
|
2020-06-17 17:37:01 -04:00
|
|
|
LET resultItemSelector = '[data-component-type="s-search-result"]'
|
2021-09-02 11:09:48 -04:00
|
|
|
LET nextBtnSelector = '.s-pagination-next:not(.s-pagination-disabled)'
|
2020-06-17 17:37:01 -04:00
|
|
|
LET priceWholeSelector = '.a-price-whole'
|
|
|
|
LET priceFracSelector = '.a-price-fraction'
|
2018-11-12 19:58:12 -05:00
|
|
|
|
|
|
|
LET result = (
|
|
|
|
FOR pageNum IN PAGINATION(amazon, nextBtnSelector)
|
2020-06-17 17:37:01 -04:00
|
|
|
LIMIT @pages
|
2018-11-12 19:58:12 -05:00
|
|
|
|
2021-09-02 11:09:48 -04:00
|
|
|
LET waitSelector = pageNum > 0 ? WAIT_ELEMENT(amazon, resultListSelector) : false
|
2018-11-12 19:58:12 -05:00
|
|
|
|
|
|
|
LET items = (
|
|
|
|
FOR el IN ELEMENTS(amazon, resultItemSelector)
|
2020-06-17 17:37:01 -04:00
|
|
|
LET hasPrice = ELEMENT_EXISTS(el, priceWholeSelector)
|
|
|
|
LET priceWholeTxt = hasPrice ? FIRST(REGEX_MATCH(INNER_TEXT(el, priceWholeSelector), "[0-9]+")) : "0"
|
|
|
|
LET priceFracTxt = hasPrice ? FIRST(REGEX_MATCH(INNER_TEXT(el, priceFracSelector), "[0-9]+")) : "00"
|
|
|
|
LET price = TO_FLOAT(priceWholeTxt + "." + priceFracTxt)
|
|
|
|
LET anchor = ELEMENT(el, "a")
|
|
|
|
|
2018-11-12 19:58:12 -05:00
|
|
|
RETURN {
|
2021-09-02 11:09:48 -04:00
|
|
|
page: pageNum,
|
2020-06-17 17:37:01 -04:00
|
|
|
url: baseURL + anchor.attributes.href,
|
2018-11-12 19:58:12 -05:00
|
|
|
title: INNER_TEXT(el, 'h2'),
|
2020-06-17 17:37:01 -04:00
|
|
|
price
|
2018-11-12 19:58:12 -05:00
|
|
|
}
|
|
|
|
)
|
|
|
|
|
|
|
|
RETURN items
|
|
|
|
)
|
|
|
|
|
|
|
|
RETURN FLATTEN(result)
|