nuclei/v2/pkg/protocols/headless/engine/page_actions.go

537 lines
14 KiB
Go
Raw Normal View History

package engine
import (
"io/ioutil"
"net"
"net/url"
"regexp"
"strconv"
"strings"
"time"
"github.com/go-rod/rod"
"github.com/go-rod/rod/lib/proto"
"github.com/pkg/errors"
"github.com/segmentio/ksuid"
"github.com/valyala/fasttemplate"
)
// ExecuteActions executes a list of actions on a page.
func (p *Page) ExecuteActions(baseURL *url.URL, actions []*Action) (map[string]string, error) {
var err error
outData := make(map[string]string)
for _, act := range actions {
actionType := ActionStringToAction[act.ActionType]
switch actionType {
case ActionNavigate:
err = p.NavigateURL(act, outData, baseURL)
case ActionScript:
err = p.RunScript(act, outData)
case ActionClick:
err = p.ClickElement(act, outData)
case ActionRightClick:
err = p.RightClickElement(act, outData)
case ActionTextInput:
err = p.InputElement(act, outData)
case ActionScreenshot:
err = p.Screenshot(act, outData)
case ActionTimeInput:
err = p.TimeInputElement(act, outData)
case ActionSelectInput:
err = p.SelectInputElement(act, outData)
case ActionWaitLoad:
err = p.WaitLoad(act, outData)
case ActionGetResource:
err = p.GetResource(act, outData)
case ActionExtract:
err = p.SelectInputElement(act, outData)
case ActionWaitEvent:
err = p.WaitEvent(act, outData)
case ActionFilesInput:
err = p.FilesInput(act, outData)
case ActionAddHeader:
err = p.ActionAddHeader(act, outData)
case ActionSetHeader:
err = p.ActionSetHeader(act, outData)
case ActionDeleteHeader:
err = p.ActionDeleteHeader(act, outData)
case ActionSetBody:
err = p.ActionSetBody(act, outData)
case ActionSetMethod:
err = p.ActionSetMethod(act, outData)
case ActionKeyboard:
err = p.KeyboardAction(act, outData)
2021-03-01 08:50:56 +00:00
case ActionDebug:
err = p.DebugAction(act, outData)
case ActionSleep:
err = p.SleepAction(act, outData)
default:
continue
}
if err != nil {
2021-02-26 07:43:11 +00:00
return nil, errors.Wrap(err, "error occurred executing action")
}
}
return outData, nil
}
type requestRule struct {
Action ActionType
Part string
Args map[string]string
}
// ActionAddHeader executes a AddHeader action.
func (p *Page) ActionAddHeader(act *Action, out map[string]string) error {
in := act.GetArg("part")
args := make(map[string]string)
args["key"] = act.GetArg("key")
args["value"] = act.GetArg("value")
rule := requestRule{
Action: ActionAddHeader,
Part: in,
Args: args,
}
p.rules = append(p.rules, rule)
return nil
}
// ActionSetHeader executes a SetHeader action.
func (p *Page) ActionSetHeader(act *Action, out map[string]string) error {
in := act.GetArg("part")
args := make(map[string]string)
args["key"] = act.GetArg("key")
args["value"] = act.GetArg("value")
rule := requestRule{
Action: ActionSetHeader,
Part: in,
Args: args,
}
p.rules = append(p.rules, rule)
return nil
}
// ActionDeleteHeader executes a DeleteHeader action.
func (p *Page) ActionDeleteHeader(act *Action, out map[string]string) error {
in := act.GetArg("part")
args := make(map[string]string)
args["key"] = act.GetArg("key")
rule := requestRule{
Action: ActionDeleteHeader,
Part: in,
Args: args,
}
p.rules = append(p.rules, rule)
return nil
}
// ActionSetBody executes a SetBody action.
func (p *Page) ActionSetBody(act *Action, out map[string]string) error {
in := act.GetArg("part")
args := make(map[string]string)
args["body"] = act.GetArg("body")
rule := requestRule{
Action: ActionSetBody,
Part: in,
Args: args,
}
p.rules = append(p.rules, rule)
return nil
}
// ActionSetMethod executes an SetMethod action.
func (p *Page) ActionSetMethod(act *Action, out map[string]string) error {
in := act.GetArg("part")
args := make(map[string]string)
args["method"] = act.GetArg("method")
rule := requestRule{
Action: ActionSetMethod,
Part: in,
Args: args,
}
p.rules = append(p.rules, rule)
return nil
}
// NavigateURL executes an ActionLoadURL actions loading a URL for the page.
func (p *Page) NavigateURL(action *Action, out map[string]string, parsed *url.URL) error {
2021-02-26 07:43:11 +00:00
URL := action.GetArg("url")
if URL == "" {
return errors.New("invalid arguments provided")
}
2021-02-26 07:43:11 +00:00
// Handle the dynamic value substitution here.
URL, parsed = baseURLWithTemplatePrefs(URL, parsed)
values := map[string]interface{}{"Hostname": parsed.Hostname()}
2021-02-26 07:43:11 +00:00
if strings.HasSuffix(parsed.Path, "/") && strings.Contains(URL, "{{BaseURL}}/") {
parsed.Path = strings.TrimSuffix(parsed.Path, "/")
}
parsedString := parsed.String()
values["BaseURL"] = parsedString
2021-02-26 07:43:11 +00:00
final := fasttemplate.ExecuteStringStd(URL, "{{", "}}", values)
err := p.page.Navigate(final)
if err != nil {
return errors.Wrap(err, "could not navigate")
}
return nil
}
// RunScript runs a script on the loaded page
func (p *Page) RunScript(action *Action, out map[string]string) error {
code := action.GetArg("code")
if code == "" {
return errors.New("invalid arguments provided")
}
if action.GetArg("hook") == "true" {
if _, err := p.page.EvalOnNewDocument(code); err != nil {
return err
}
}
data, err := p.page.Eval(code)
if err != nil {
return err
}
2021-02-25 07:07:47 +00:00
if data != nil && action.Name != "" {
out[action.Name] = data.Value.String()
}
return nil
}
// ClickElement executes click actions for an element.
func (p *Page) ClickElement(act *Action, out map[string]string) error {
element, err := p.pageElementBy(act.Data)
if err != nil {
return errors.Wrap(err, "could not get element")
}
if err = element.ScrollIntoView(); err != nil {
return errors.Wrap(err, "could not scroll into view")
}
if err = element.Click(proto.InputMouseButtonLeft); err != nil {
return errors.Wrap(err, "could not click element")
}
return nil
}
// KeyboardAction executes a keyboard action on the page.
func (p *Page) KeyboardAction(act *Action, out map[string]string) error {
return p.page.Keyboard.Press([]rune(act.GetArg("keys"))...)
}
// RightClickElement executes right click actions for an element.
func (p *Page) RightClickElement(act *Action, out map[string]string) error {
element, err := p.pageElementBy(act.Data)
if err != nil {
return errors.Wrap(err, "could not get element")
}
if err = element.ScrollIntoView(); err != nil {
return errors.Wrap(err, "could not scroll into view")
}
if err = element.Click(proto.InputMouseButtonRight); err != nil {
return errors.Wrap(err, "could not right click element")
}
return nil
}
// Screenshot executes screenshot action on a page
func (p *Page) Screenshot(act *Action, out map[string]string) error {
to := act.GetArg("to")
if to == "" {
to = ksuid.New().String()
2021-03-06 09:01:21 +00:00
if act.Name != "" {
out[act.Name] = to
}
}
var data []byte
var err error
if act.GetArg("fullpage") == "true" {
data, err = p.page.Screenshot(true, &proto.PageCaptureScreenshot{})
} else {
data, err = p.page.Screenshot(false, &proto.PageCaptureScreenshot{})
}
if err != nil {
return errors.Wrap(err, "could not take screenshot")
}
err = ioutil.WriteFile(to+".png", data, 0540)
if err != nil {
return errors.Wrap(err, "could not write screenshot")
}
return nil
}
// InputElement executes input element actions for an element.
func (p *Page) InputElement(act *Action, out map[string]string) error {
value := act.GetArg("value")
if value == "" {
return errors.New("invalid arguments provided")
}
element, err := p.pageElementBy(act.Data)
if err != nil {
return errors.Wrap(err, "could not get element")
}
if err = element.ScrollIntoView(); err != nil {
return errors.Wrap(err, "could not scroll into view")
}
if err = element.Input(value); err != nil {
return errors.Wrap(err, "could not input element")
}
return nil
}
// TimeInputElement executes time input on an element
func (p *Page) TimeInputElement(act *Action, out map[string]string) error {
value := act.GetArg("value")
if value == "" {
return errors.New("invalid arguments provided")
}
element, err := p.pageElementBy(act.Data)
if err != nil {
return errors.Wrap(err, "could not get element")
}
if err = element.ScrollIntoView(); err != nil {
return errors.Wrap(err, "could not scroll into view")
}
t, err := time.Parse(time.RFC3339, value)
if err != nil {
return errors.Wrap(err, "could not parse time")
}
if err := element.InputTime(t); err != nil {
return errors.Wrap(err, "could not input element")
}
return nil
}
// SelectInputElement executes select input statement action on a element
func (p *Page) SelectInputElement(act *Action, out map[string]string) error {
value := act.GetArg("value")
if value == "" {
return errors.New("invalid arguments provided")
}
element, err := p.pageElementBy(act.Data)
if err != nil {
return errors.Wrap(err, "could not get element")
}
if err = element.ScrollIntoView(); err != nil {
return errors.Wrap(err, "could not scroll into view")
}
selectedbool := false
if act.GetArg("selected") == "true" {
selectedbool = true
}
by := act.GetArg("selector")
if err := element.Select([]string{value}, selectedbool, selectorBy(by)); err != nil {
return errors.Wrap(err, "could not select input")
}
return nil
}
// WaitLoad waits for the page to load
func (p *Page) WaitLoad(act *Action, out map[string]string) error {
p.page.Timeout(1 * time.Second).WaitNavigation(proto.PageLifecycleEventNameDOMContentLoaded)()
// Wait for the window.onload event and also wait for the network requests
// to become idle for a maximum duration of 2 seconds. If the requests
// do not finish,
if err := p.page.WaitLoad(); err != nil {
return errors.Wrap(err, "could not reset mouse")
}
_ = p.page.WaitIdle(1 * time.Second)
return nil
}
// GetResource gets a resource from an element from page.
func (p *Page) GetResource(act *Action, out map[string]string) error {
element, err := p.pageElementBy(act.Data)
if err != nil {
return errors.Wrap(err, "could not get element")
}
resource, err := element.Resource()
if err != nil {
return errors.Wrap(err, "could not get src for element")
}
2021-03-06 09:01:21 +00:00
if act.Name != "" {
out[act.Name] = string(resource)
}
return nil
}
// FilesInput acts with a file input element on page
func (p *Page) FilesInput(act *Action, out map[string]string) error {
element, err := p.pageElementBy(act.Data)
if err != nil {
return errors.Wrap(err, "could not get element")
}
if err = element.ScrollIntoView(); err != nil {
return errors.Wrap(err, "could not scroll into view")
}
value := act.GetArg("value")
filesPaths := strings.Split(value, ",")
if err := element.SetFiles(filesPaths); err != nil {
return errors.Wrap(err, "could not set files")
}
return nil
}
// ExtractElement extracts from an element on the page.
func (p *Page) ExtractElement(act *Action, out map[string]string) error {
element, err := p.pageElementBy(act.Data)
if err != nil {
return errors.Wrap(err, "could not get element")
}
if err = element.ScrollIntoView(); err != nil {
return errors.Wrap(err, "could not scroll into view")
}
switch act.GetArg("target") {
case "attribute":
attrName := act.GetArg("attribute")
if attrName == "" {
return errors.New("attribute can't be empty")
}
attrValue, err := element.Attribute(attrName)
if err != nil {
return errors.Wrap(err, "could not get attribute")
}
2021-03-06 09:01:21 +00:00
if act.Name != "" {
out[act.Name] = *attrValue
}
default:
text, err := element.Text()
if err != nil {
return errors.Wrap(err, "could not get element text node")
}
2021-03-06 09:01:21 +00:00
if act.Name != "" {
out[act.Name] = text
}
}
return nil
}
type protoEvent struct {
event string
}
// ProtoEvent returns the cdp.Event.Method
func (p *protoEvent) ProtoEvent() string {
return p.event
}
// WaitEvent waits for an event to happen on the page.
func (p *Page) WaitEvent(act *Action, out map[string]string) error {
event := act.GetArg("event")
if event == "" {
return errors.New("event not recognized")
}
protoEvent := &protoEvent{event: event}
// Uses another instance in order to be able to chain the timeout only to the wait operation
pagec := p.page
timeout := act.GetArg("timeout")
if timeout != "" {
ts, err := strconv.Atoi(timeout)
if err != nil {
return errors.Wrap(err, "could not get timeout")
}
if ts > 0 {
pagec = p.page.Timeout(time.Duration(ts) * time.Second)
}
}
// Just wait the event to happen
pagec.WaitEvent(protoEvent)()
return nil
}
// pageElementBy returns a page element from a variety of inputs.
//
// Supported values for by: r -> selector & regex, x -> xpath, js -> eval js,
// search => query, default ("") => selector.
func (p *Page) pageElementBy(data map[string]string) (*rod.Element, error) {
by, ok := data["by"]
if !ok {
by = ""
}
page := p.page
switch by {
2021-02-25 07:07:47 +00:00
case "r", "regex":
return page.ElementR(data["selector"], data["regex"])
case "x", "xpath":
return page.ElementX(data["xpath"])
case "js":
return page.ElementByJS(&rod.EvalOptions{JS: data["js"]})
case "search":
elms, err := page.Search(0, 1, data["query"])
if err != nil {
return nil, err
}
if len(elms) > 0 {
return elms[0], nil
}
return nil, errors.New("no such element")
default:
return page.Element(data["selector"])
}
}
2021-03-01 08:50:56 +00:00
// DebugAction enables debug action on a page.
func (p *Page) DebugAction(act *Action, out map[string]string) error {
p.instance.browser.engine.SlowMotion(5 * time.Second)
p.instance.browser.engine.Trace(true)
return nil
}
// SleepAction sleeps on the page for a specified duration
func (p *Page) SleepAction(act *Action, out map[string]string) error {
seconds := act.Data["duration"]
if seconds == "" {
seconds = "5"
}
parsed, err := strconv.Atoi(seconds)
if err != nil {
return err
}
time.Sleep(time.Duration(parsed) * time.Second)
return nil
}
// selectorBy returns a selector from a representation.
func selectorBy(selector string) rod.SelectorType {
switch selector {
case "r":
return rod.SelectorTypeRegex
case "css":
return rod.SelectorTypeCSSSector
case "regex":
return rod.SelectorTypeRegex
default:
return rod.SelectorTypeText
}
}
var (
urlWithPortRegex = regexp.MustCompile(`{{BaseURL}}:(\d+)`)
)
// baseURLWithTemplatePrefs returns the url for BaseURL keeping
// the template port and path preference over the user provided one.
func baseURLWithTemplatePrefs(data string, parsed *url.URL) (string, *url.URL) {
// template port preference over input URL port if template has a port
matches := urlWithPortRegex.FindAllStringSubmatch(data, -1)
if len(matches) == 0 {
return data, parsed
}
port := matches[0][1]
parsed.Host = net.JoinHostPort(parsed.Hostname(), port)
data = strings.ReplaceAll(data, ":"+port, "")
if parsed.Path == "" {
parsed.Path = "/"
}
return data, parsed
}