Path: blob/dev/pkg/protocols/headless/request.go
2070 views
package headless

import (
	"fmt"
	"maps"
	"net/url"
	"strings"
	"time"

	"github.com/projectdiscovery/retryablehttp-go"

	"github.com/pkg/errors"

	"github.com/projectdiscovery/gologger"
	"github.com/projectdiscovery/nuclei/v3/pkg/fuzz"
	"github.com/projectdiscovery/nuclei/v3/pkg/output"
	"github.com/projectdiscovery/nuclei/v3/pkg/protocols"
	"github.com/projectdiscovery/nuclei/v3/pkg/protocols/common/contextargs"
	"github.com/projectdiscovery/nuclei/v3/pkg/protocols/common/generators"
	"github.com/projectdiscovery/nuclei/v3/pkg/protocols/common/helpers/eventcreator"
	"github.com/projectdiscovery/nuclei/v3/pkg/protocols/common/helpers/responsehighlighter"
	"github.com/projectdiscovery/nuclei/v3/pkg/protocols/common/interactsh"
	"github.com/projectdiscovery/nuclei/v3/pkg/protocols/headless/engine"
	protocolutils "github.com/projectdiscovery/nuclei/v3/pkg/protocols/utils"
	templateTypes "github.com/projectdiscovery/nuclei/v3/pkg/templates/types"
	"github.com/projectdiscovery/nuclei/v3/pkg/types"
	urlutil "github.com/projectdiscovery/utils/url"
)

var _ protocols.Request = &Request{}

// errCouldNotGetHtmlElement is the message used to wrap every failure that
// happens while a browser instance is created or the steps are run.
const errCouldNotGetHtmlElement = "could not get html element"

// Type returns the type of the protocol request
func (request *Request) Type() templateTypes.ProtocolType {
	return templateTypes.HeadlessProtocol
}

// ExecuteWithResults executes the protocol requests and returns results instead of writing them.
//
// For self-contained requests the input is replaced by the base URL of the
// first navigate action. The variable map is assembled from the input, the
// template context (when present), metadata, option payloads, evaluated
// template variables and constants. Execution is then delegated to the fuzzing
// path when fuzzing rules are configured, otherwise the steps are run once per
// payload combination (or exactly once when there is no payload generator).
func (request *Request) ExecuteWithResults(input *contextargs.Context, metadata, previous output.InternalEvent, callback protocols.OutputEventCallback) error {
	if request.SelfContained {
		baseURL, err := extractBaseURLFromActions(request.Steps)
		if err != nil {
			return err
		}
		input = contextargs.NewWithInput(input.Context(), baseURL)
	}

	if request.options.Browser.UserAgent() == "" {
		request.options.Browser.SetUserAgent(request.compiledUserAgent)
	}

	vars := protocolutils.GenerateVariablesWithContextArgs(input, false)
	optionVars := generators.BuildPayloadFromOptions(request.options.Options)
	// add templatecontext variables to varMap
	if request.options.HasTemplateCtx(input.MetaInput) {
		vars = generators.MergeMaps(vars, request.options.GetTemplateCtx(input.MetaInput).GetAll())
	}

	variablesMap := request.options.Variables.Evaluate(vars)
	vars = generators.MergeMaps(vars, metadata, optionVars, variablesMap, request.options.Constants)

	// check for operator matches by wrapping callback
	gotmatches := false
	wrappedCallback := func(results *output.InternalWrappedEvent) {
		callback(results)
		if results != nil && results.OperatorsResult != nil {
			gotmatches = results.OperatorsResult.Matched
		}
	}

	// verify if fuzz elaboration was requested
	if len(request.Fuzzing) > 0 {
		return request.executeFuzzingRule(input, vars, previous, wrappedCallback)
	}

	// without a payload generator the steps are executed once with a copy of vars
	if request.generator == nil {
		return request.executeRequestWithPayloads(input, maps.Clone(vars), previous, wrappedCallback)
	}

	stopAtFirstMatch := request.StopAtFirstMatch || request.options.Options.StopAtFirstMatch || request.options.StopAtFirstMatch
	iterator := request.generator.NewIterator()
	for {
		value, ok := iterator.Value()
		if !ok {
			return nil
		}
		if gotmatches && stopAtFirstMatch {
			return nil
		}
		value = generators.MergeMaps(value, vars)
		if err := request.executeRequestWithPayloads(input, value, previous, wrappedCallback); err != nil {
			return err
		}
	}
}

// extractBaseURLFromActions returns "<scheme>://<host>" of the URL argument of
// the first navigate action found in steps. It returns an error when that URL
// cannot be parsed or when steps contains no navigate action.
func extractBaseURLFromActions(steps []*engine.Action) (string, error) {
	for _, action := range steps {
		if action.ActionType.ActionType != engine.ActionNavigate {
			continue
		}
		navigateURL := action.GetArg("url")
		parsed, err := urlutil.Parse(navigateURL)
		if err != nil {
			return "", errors.Errorf("could not parse URL '%s': %s", navigateURL, err.Error())
		}
		return fmt.Sprintf("%s://%s", parsed.Scheme, parsed.Host), nil
	}
	return "", errors.New("no navigation action found")
}

// executeRequestWithPayloads runs the request steps in a new browser instance
// using the given payloads, builds the output event from the resulting page
// and hands it either to callback or to the Interactsh client.
//
// It returns types.ErrNoMoreRequests when stop-at-first-match is enabled and
// the produced event carries an operator result.
func (request *Request) executeRequestWithPayloads(input *contextargs.Context, payloads map[string]interface{}, previous output.InternalEvent, callback protocols.OutputEventCallback) error {
	// reportFailure records a failed request in the output and progress
	// trackers and returns the wrapped error for the caller to return.
	reportFailure := func(err error) error {
		request.options.Output.Request(request.options.TemplatePath, input.MetaInput.Input, request.Type().String(), err)
		request.options.Progress.IncrementFailedRequestsBy(1)
		return errors.Wrap(err, errCouldNotGetHtmlElement)
	}

	instance, err := request.options.Browser.NewInstance()
	if err != nil {
		return reportFailure(err)
	}
	defer func() {
		_ = instance.Close()
	}()

	instance.SetInteractsh(request.options.Interactsh)

	if _, err := url.Parse(input.MetaInput.Input); err != nil {
		return reportFailure(err)
	}
	options := &engine.Options{
		Timeout:       time.Duration(request.options.Options.PageTimeout) * time.Second,
		DisableCookie: request.DisableCookie,
		Options:       request.options.Options,
	}

	if !options.DisableCookie && input.CookieJar == nil {
		return errors.New("cookie reuse enabled but cookie-jar is nil")
	}

	out, page, err := instance.Run(input, request.Steps, payloads, options)
	if err != nil {
		return reportFailure(err)
	}
	defer page.Close()

	reqLog := instance.GetRequestLog()
	navigatedURL := request.getLastNavigationURLWithLog(reqLog) // also known as matchedURL if there is a match

	request.options.Output.Request(request.options.TemplatePath, input.MetaInput.Input, request.Type().String(), nil)
	request.options.Progress.IncrementRequests()
	gologger.Verbose().Msgf("Sent Headless request to %s", navigatedURL)

	// reqBuilder stays empty unless one of the debug options is enabled
	reqBuilder := &strings.Builder{}
	if request.options.Options.Debug || request.options.Options.DebugRequests || request.options.Options.DebugResponse {
		gologger.Info().Msgf("[%s] Dumped Headless request for %s", request.options.TemplateID, navigatedURL)

		for _, act := range request.Steps {
			if act.ActionType.ActionType != engine.ActionNavigate {
				_, _ = fmt.Fprintf(reqBuilder, "\t%s\n", act.String())
				continue
			}
			value := act.GetArg("url")
			if logged := reqLog[value]; logged != "" {
				_, _ = fmt.Fprintf(reqBuilder, "\tnavigate => %v\n", logged)
			} else {
				_, _ = fmt.Fprintf(reqBuilder, "%v not found in %v\n", value, reqLog)
			}
		}
		gologger.Debug().Msg(reqBuilder.String())
	}

	// best effort: the response body stays empty when the html element is unavailable
	var responseBody string
	if html, err := page.Page().Element("html"); err == nil {
		responseBody, _ = html.HTML()
	}

	// comma-ok assertions: a non-string value yields "" instead of a panic
	header, _ := out.GetOrDefault("header", "").(string)

	// NOTE(dwisiswant0): `status_code` key should be an integer type.
	// Ref: https://github.com/projectdiscovery/nuclei/pull/5545#discussion_r1721291013
	statusCode, _ := out.GetOrDefault("status_code", "").(string)

	outputEvent := request.responseToDSLMap(responseBody, header, statusCode, reqBuilder.String(), input.MetaInput.Input, navigatedURL, page.DumpHistory())
	// add response fields to template context and merge templatectx variables to output event
	request.options.AddTemplateVars(input.MetaInput, request.Type(), request.ID, outputEvent)
	if request.options.HasTemplateCtx(input.MetaInput) {
		outputEvent = generators.MergeMaps(outputEvent, request.options.GetTemplateCtx(input.MetaInput).GetAll())
	}

	maps.Copy(outputEvent, out)
	maps.Copy(outputEvent, payloads)

	var event *output.InternalWrappedEvent
	if len(page.InteractshURLs) == 0 || request.options.Interactsh == nil {
		// No Interactsh URLs were used, or there is no Interactsh client to
		// hand the event to: evaluate operators right away. Handling the
		// nil-client case here keeps event non-nil for the code below.
		event = eventcreator.CreateEvent(request, outputEvent, request.options.Options.Debug || request.options.Options.DebugResponse)
		callback(event)
	} else {
		event = &output.InternalWrappedEvent{InternalEvent: outputEvent}
		request.options.Interactsh.RequestEvent(page.InteractshURLs, &interactsh.RequestData{
			MakeResultFunc: request.MakeResultEvent,
			Event:          event,
			Operators:      request.CompiledOperators,
			MatchFunc:      request.Match,
			ExtractFunc:    request.Extract,
		})
		event.UsesInteractsh = true
	}

	dumpResponse(event, request.options, responseBody, input.MetaInput.Input)
	shouldStopAtFirstMatch := request.StopAtFirstMatch || request.options.StopAtFirstMatch || request.options.Options.StopAtFirstMatch
	if shouldStopAtFirstMatch && event.HasOperatorResult() {
		return types.ErrNoMoreRequests
	}
	return nil
}

// dumpResponse logs the (highlighted) response body when Debug or
// DebugResponse is set and stores the raw body through the output writer when
// StoreResponse is set. It does nothing when none of the three is enabled.
func dumpResponse(event *output.InternalWrappedEvent, requestOptions *protocols.ExecutorOptions, responseBody string, input string) {
	debugEnabled := requestOptions.Options.Debug || requestOptions.Options.DebugResponse
	if !debugEnabled && !requestOptions.Options.StoreResponse {
		return
	}

	msg := fmt.Sprintf("[%s] Dumped Headless response for %s\n\n", requestOptions.TemplateID, input)
	if debugEnabled {
		resp := responsehighlighter.Highlight(event.OperatorsResult, responseBody, requestOptions.Options.NoColor, false)
		gologger.Debug().Msgf("%s%s", msg, resp)
	}
	if requestOptions.Options.StoreResponse {
		requestOptions.Output.WriteStoreDebugData(input, requestOptions.TemplateID, "headless", fmt.Sprintf("%s%s", msg, responseBody))
	}
}

// executeFuzzingRule executes a fuzzing rule in the template request
//
// Every request generated by a rule is run through executeRequestWithPayloads
// against a clone of input whose target is the generated request URL.
func (request *Request) executeFuzzingRule(input *contextargs.Context, payloads map[string]interface{}, previous output.InternalEvent, callback protocols.OutputEventCallback) error {
	stopAtFirstMatch := request.StopAtFirstMatch || request.options.Options.StopAtFirstMatch || request.options.StopAtFirstMatch

	// check for operator matches by wrapping callback (same approach as
	// ExecuteWithResults), so the stop-at-first-match guard below can trigger
	gotmatches := false
	wrappedCallback := func(results *output.InternalWrappedEvent) {
		callback(results)
		if results != nil && results.OperatorsResult != nil && results.OperatorsResult.Matched {
			gotmatches = true
		}
	}

	fuzzRequestCallback := func(gr fuzz.GeneratedRequest) bool {
		if gotmatches && stopAtFirstMatch {
			return true
		}
		newInput := input.Clone()
		newInput.MetaInput.Input = gr.Request.String()
		// any error, including types.ErrNoMoreRequests, is reported as false
		// NOTE(review): presumably false tells the fuzz rule to stop - confirm
		// against the fuzz package.
		if err := request.executeRequestWithPayloads(newInput, gr.DynamicValues, previous, wrappedCallback); err != nil {
			return false
		}
		return true
	}

	if _, err := urlutil.Parse(input.MetaInput.Input); err != nil {
		return errors.Wrap(err, "could not parse url")
	}
	baseRequest, err := retryablehttp.NewRequest("GET", input.MetaInput.Input, nil)
	if err != nil {
		return errors.Wrap(err, "could not create base request")
	}
	for _, rule := range request.Fuzzing {
		err := rule.Execute(&fuzz.ExecuteRuleInput{
			Input:       input,
			Callback:    fuzzRequestCallback,
			Values:      payloads,
			BaseRequest: baseRequest,
		})
		// errors.Is also recognises the sentinel when it has been wrapped
		if errors.Is(err, types.ErrNoMoreRequests) {
			return nil
		}
		if err != nil {
			return errors.Wrap(err, "could not execute rule")
		}
	}
	return nil
}

// getLastNavigationURLWithLog walks the steps from last to first and returns
// the request log entry of the first navigate action whose URL argument has a
// non-empty entry in reqLog. It returns "" when no such action exists.
func (request *Request) getLastNavigationURLWithLog(reqLog map[string]string) string {
	for i := len(request.Steps) - 1; i >= 0; i-- {
		step := request.Steps[i]
		if step.ActionType.ActionType != engine.ActionNavigate {
			continue
		}
		if navigated := reqLog[step.GetArg("url")]; navigated != "" {
			return navigated
		}
	}
	return ""
}