mirror of
https://github.com/MontFerret/ferret.git
synced 2025-01-04 03:02:02 +02:00
a3d3fe727d
* Made custom and random UA optional * Added pirvate context keys
195 lines
3.6 KiB
Go
195 lines
3.6 KiB
Go
package dynamic
|
|
|
|
import (
|
|
"context"
|
|
"github.com/MontFerret/ferret/pkg/html/common"
|
|
"github.com/MontFerret/ferret/pkg/runtime/logging"
|
|
"github.com/MontFerret/ferret/pkg/runtime/values"
|
|
"github.com/mafredri/cdp"
|
|
"github.com/mafredri/cdp/devtool"
|
|
"github.com/mafredri/cdp/protocol/emulation"
|
|
"github.com/mafredri/cdp/protocol/page"
|
|
"github.com/mafredri/cdp/protocol/target"
|
|
"github.com/mafredri/cdp/rpcc"
|
|
"github.com/mafredri/cdp/session"
|
|
"github.com/pkg/errors"
|
|
"sync"
|
|
)
|
|
|
|
type Driver struct {
|
|
sync.Mutex
|
|
dev *devtool.DevTools
|
|
conn *rpcc.Conn
|
|
client *cdp.Client
|
|
session *session.Manager
|
|
contextID target.BrowserContextID
|
|
options *Options
|
|
}
|
|
|
|
func NewDriver(address string, opts ...Option) *Driver {
|
|
drv := new(Driver)
|
|
drv.dev = devtool.New(address)
|
|
drv.options = new(Options)
|
|
|
|
for _, opt := range opts {
|
|
opt(drv.options)
|
|
}
|
|
|
|
return drv
|
|
}
|
|
|
|
func (drv *Driver) GetDocument(ctx context.Context, targetURL values.String) (values.HTMLNode, error) {
|
|
logger := logging.FromContext(ctx)
|
|
|
|
err := drv.init(ctx)
|
|
|
|
if err != nil {
|
|
logger.
|
|
Error().
|
|
Err(err).
|
|
Str("driver", "dynamic").
|
|
Msg("failed to initialize the driver")
|
|
|
|
return nil, err
|
|
}
|
|
|
|
ctx, cancel := context.WithTimeout(ctx, DefaultTimeout)
|
|
defer cancel()
|
|
|
|
url := targetURL.String()
|
|
|
|
if url == "" {
|
|
url = BlankPageURL
|
|
}
|
|
|
|
// Create a new target belonging to the browser context, similar
|
|
// to opening a new tab in an incognito window.
|
|
createTargetArgs := target.NewCreateTargetArgs(url).SetBrowserContextID(drv.contextID)
|
|
createTarget, err := drv.client.Target.CreateTarget(ctx, createTargetArgs)
|
|
|
|
if err != nil {
|
|
logger.
|
|
Error().
|
|
Err(err).
|
|
Str("driver", "dynamic").
|
|
Msg("failed to create a browser target")
|
|
|
|
return nil, err
|
|
}
|
|
|
|
// Connect to target using the existing websocket connection.
|
|
conn, err := drv.session.Dial(ctx, createTarget.TargetID)
|
|
|
|
if err != nil {
|
|
logger.
|
|
Error().
|
|
Err(err).
|
|
Str("driver", "dynamic").
|
|
Msg("failed to establish a connection")
|
|
|
|
return nil, err
|
|
}
|
|
|
|
client := cdp.NewClient(conn)
|
|
|
|
err = runBatch(
|
|
func() error {
|
|
return client.Page.Enable(ctx)
|
|
},
|
|
|
|
func() error {
|
|
return client.Page.SetLifecycleEventsEnabled(
|
|
ctx,
|
|
page.NewSetLifecycleEventsEnabledArgs(true),
|
|
)
|
|
},
|
|
|
|
func() error {
|
|
return client.DOM.Enable(ctx)
|
|
},
|
|
|
|
func() error {
|
|
return client.Runtime.Enable(ctx)
|
|
},
|
|
|
|
func() error {
|
|
ua := common.GetUserAgent(drv.options.userAgent)
|
|
|
|
logger.
|
|
Debug().
|
|
Str("user-agent", ua).
|
|
Msg("using User-Agent")
|
|
|
|
// do not use custom user agent
|
|
if ua == "" {
|
|
return nil
|
|
}
|
|
|
|
return client.Emulation.SetUserAgentOverride(
|
|
ctx,
|
|
emulation.NewSetUserAgentOverrideArgs(ua),
|
|
)
|
|
},
|
|
)
|
|
|
|
return LoadHTMLDocument(ctx, conn, client, url)
|
|
}
|
|
|
|
func (drv *Driver) Close() error {
|
|
drv.Lock()
|
|
defer drv.Unlock()
|
|
|
|
if drv.session != nil {
|
|
drv.session.Close()
|
|
|
|
return drv.conn.Close()
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
func (drv *Driver) init(ctx context.Context) error {
|
|
drv.Lock()
|
|
defer drv.Unlock()
|
|
|
|
if drv.session == nil {
|
|
ver, err := drv.dev.Version(ctx)
|
|
|
|
if err != nil {
|
|
return errors.Wrap(err, "failed to initialize driver")
|
|
}
|
|
|
|
bconn, err := rpcc.DialContext(ctx, ver.WebSocketDebuggerURL)
|
|
|
|
if err != nil {
|
|
return errors.Wrap(err, "failed to initialize driver")
|
|
}
|
|
|
|
bc := cdp.NewClient(bconn)
|
|
|
|
sess, err := session.NewManager(bc)
|
|
|
|
if err != nil {
|
|
bconn.Close()
|
|
|
|
return errors.Wrap(err, "failed to initialize driver")
|
|
}
|
|
|
|
createCtx, err := bc.Target.CreateBrowserContext(ctx)
|
|
|
|
if err != nil {
|
|
bconn.Close()
|
|
sess.Close()
|
|
|
|
return err
|
|
}
|
|
|
|
drv.conn = bconn
|
|
drv.client = bc
|
|
drv.session = sess
|
|
drv.contextID = createCtx.BrowserContextID
|
|
}
|
|
|
|
return nil
|
|
}
|