1
0
mirror of https://github.com/MontFerret/ferret.git synced 2024-12-16 11:37:36 +02:00
ferret/pkg/stdlib/html/pagination.go
Tim Voronov 34c8c02258
Refactoring/externalized html (#234)
* Externalized HTML drivers

* Fixed unit tests

* Updated logging

* Added support to set default driver

* Updated GetIn and SetIn helpers
2019-02-19 18:10:18 -05:00

108 lines
2.1 KiB
Go

package html
import (
"context"
"github.com/MontFerret/ferret/pkg/drivers"
"github.com/MontFerret/ferret/pkg/runtime/core"
"github.com/MontFerret/ferret/pkg/runtime/values"
"github.com/MontFerret/ferret/pkg/runtime/values/types"
)
// Pagination creates an iterator that goes through pages using CSS selector.
// The iterator starts from the current page i.e. it does not change the page on 1st iteration.
// That allows you to keep scraping logic inside FOR loop.
// @param doc (Document) - Target document.
// @param selector (String) - CSS selector for a pagination on the page.
func Pagination(_ context.Context, args ...core.Value) (core.Value, error) {
err := core.ValidateArgs(args, 2, 2)
if err != nil {
return values.None, err
}
doc, err := toDocument(args[0])
if err != nil {
return values.None, err
}
err = core.ValidateType(args[1], types.String)
if err != nil {
return values.None, err
}
selector := args[1].(values.String)
return &Paging{doc, selector}, nil
}
var PagingType = core.NewType("paging")
type (
Paging struct {
document drivers.HTMLDocument
selector values.String
}
PagingIterator struct {
document drivers.HTMLDocument
selector values.String
pos values.Int
}
)
func (p *Paging) MarshalJSON() ([]byte, error) {
return nil, core.ErrInvalidOperation
}
func (p *Paging) Type() core.Type {
return PagingType
}
func (p *Paging) String() string {
return PagingType.String()
}
func (p *Paging) Compare(_ core.Value) int64 {
return 1
}
func (p *Paging) Unwrap() interface{} {
return nil
}
func (p *Paging) Hash() uint64 {
return 0
}
func (p *Paging) Copy() core.Value {
return values.None
}
func (p *Paging) Iterate(_ context.Context) (core.Iterator, error) {
return &PagingIterator{p.document, p.selector, -1}, nil
}
func (i *PagingIterator) Next(_ context.Context) (core.Value, core.Value, error) {
i.pos++
if i.pos == 0 {
return values.ZeroInt, values.ZeroInt, nil
}
clicked, err := i.document.ClickBySelector(i.selector)
if err != nil {
return values.None, values.None, err
}
if clicked {
return i.pos, i.pos, nil
}
// terminate
return values.None, values.None, nil
}