Ice3man fa56800fcc
Fuzzing layer enhancements + input-types support (#4477)
* feat: move fuzz package to root directory

* feat: added support for input providers like openapi,postman,etc

* feat: integration of new fuzzing logic in engine

* bugfix: use and instead of or

* fixed lint errors

* go mod tidy

* add new reqresp type + bump utils

* custom http request parser

* use new struct type RequestResponse

* introduce unified input/target provider

* abstract input formats via new inputprovider

* completed input provider refactor

* remove duplicated code

* add sdk method to load targets

* rename component url->path

* add new yaml format + remove duplicated code

* use gopkg.in/yaml.v3 for parsing

* update .gitignore

* refactor/move + docs fuzzing in http protocol

* fuzz: header + query integration test using fuzzplayground

* fix integration test runner in windows

* feat add support for filter in http fuzz

* rewrite header/query integration test with filter

* add replace regex rule

* support kv fuzzing + misc updates

* add path fuzzing example + misc improvements

* fix matchedURL + skip httpx on multi formats

* cookie fuzz integration test

* add json body + params body tests

* feat add multipart/form-data fuzzing support

* add all fuzz body integration test

* misc bug fixes + minor refactor

* add multipart form + body form unit tests

* only run fuzzing templates if -fuzz flag is given

* refactor/move fuzz playground server to pkg

* fix integration test + refactor

* add auth types and strategies

* add file auth provider

* start implementing auth logic in http

* add logic in http protocol

* static auth implemented for http

* default :80,:443 normalization

* feat: dynamic auth init

* feat: dynamic auth using templates

* validate targets count in openapi+swagger

* inputformats: add support to accept variables

* fix workflow integration test

* update lazy cred fetch logic

* fix unit test

* drop postman support

* domain related normalization

* update secrets.yaml file format + misc updates

* add auth prefetch option

* remove old secret files

* add fuzzing+auth related sdk options

* fix/support multiple mode in kv header fuzzing

* rename 'headers' -> 'header' in fuzzing rules

* fix deadlock due to merge conflict resolution

* misc update

* add bool type in parsed value

* add openapi validation+override+ new flags

* misc updates

* remove optional path parameters when unavailable

* fix swagger.yaml file

* misc updates

* update print msg

* multiple openapi validation enhancements + appMode

* add optional params in required_openapi_vars.yaml file

* improve warning/verbose msgs in format

* fix skip-format-validation not working

* use 'params/parameter' instead of 'variable' in openapi

* add retry support for flaky tests

* fix nuclei loading ignored templates (#4849)

* fix tag include logic

* fix unit test

* remove quoting in extractor output

* remove quote in debug code command

* feat: issue tracker URLs in JSON + misc fixes (#4855)

* feat: issue tracker URLs in JSON + misc fixes

* misc changes

* feat: status update support for issues

* feat: report metadata generation hook support

* feat: added CLI summary of tickets created

* misc changes

* introduce `disable-unsigned-templates` flag (#4820)

* introduce `disable-unsigned-templates` flag

* minor

* skip instead of exit

* remove duplicate imports

* use stats package + misc enhancements

* force display warning + adjust skipped stats in unsigned count

* include unsigned skipped templates without -dut flag

---------

Co-authored-by: Tarun Koyalwar <tarun@projectdiscovery.io>

* Purge cache on global callback set (#4840)

* purge cache on global callback set

* lint

* purging cache

* purge cache in runner after loading templates

* include internal cache from parsers + add global cache register/purge via config

* remove disable cache purge option

---------

Co-authored-by: Tarun Koyalwar <tarun@projectdiscovery.io>

* misc update

* add application/octet-stream support

* openapi: support path specific params

* misc option + readme update

---------

Co-authored-by: Sandeep Singh <sandeep@projectdiscovery.io>
Co-authored-by: sandeep <8293321+ehsandeep@users.noreply.github.com>
Co-authored-by: Tarun Koyalwar <tarun@projectdiscovery.io>
Co-authored-by: Tarun Koyalwar <45962551+tarunKoyalwar@users.noreply.github.com>
Co-authored-by: Dogan Can Bakir <65292895+dogancanbakir@users.noreply.github.com>
Co-authored-by: Mzack9999 <mzack9999@protonmail.com>
2024-03-14 03:08:53 +05:30

318 lines
10 KiB
Go

package automaticscan
import (
"io"
"net/http"
"os"
"path/filepath"
"strings"
"sync"
"sync/atomic"
"github.com/logrusorgru/aurora"
"github.com/pkg/errors"
"github.com/projectdiscovery/gologger"
"github.com/projectdiscovery/nuclei/v3/pkg/catalog/config"
"github.com/projectdiscovery/nuclei/v3/pkg/catalog/loader"
"github.com/projectdiscovery/nuclei/v3/pkg/core"
"github.com/projectdiscovery/nuclei/v3/pkg/input/provider"
"github.com/projectdiscovery/nuclei/v3/pkg/output"
"github.com/projectdiscovery/nuclei/v3/pkg/protocols"
"github.com/projectdiscovery/nuclei/v3/pkg/protocols/common/contextargs"
"github.com/projectdiscovery/nuclei/v3/pkg/protocols/common/helpers/writer"
"github.com/projectdiscovery/nuclei/v3/pkg/protocols/http/httpclientpool"
httputil "github.com/projectdiscovery/nuclei/v3/pkg/protocols/utils/http"
"github.com/projectdiscovery/nuclei/v3/pkg/scan"
"github.com/projectdiscovery/nuclei/v3/pkg/templates"
"github.com/projectdiscovery/nuclei/v3/pkg/testutils"
"github.com/projectdiscovery/retryablehttp-go"
"github.com/projectdiscovery/useragent"
mapsutil "github.com/projectdiscovery/utils/maps"
sliceutil "github.com/projectdiscovery/utils/slice"
stringsutil "github.com/projectdiscovery/utils/strings"
wappalyzer "github.com/projectdiscovery/wappalyzergo"
"github.com/remeh/sizedwaitgroup"
"gopkg.in/yaml.v2"
)
const (
	// mappingFilename is the name of the wappalyzer mapping file that New
	// looks up inside the default template directory.
	mappingFilename = "wappalyzer-mapping.yml"
	// maxDefaultBody is the maximum number of response body bytes read when
	// fingerprinting a target (4MB).
	maxDefaultBody = 4 << 20
)
// Options contains configuration options for automatic scan service.
// It is passed to New, which copies the individual fields onto the Service
// and additionally keeps the whole value in Service.ServiceOpts.
type Options struct {
// ExecuterOpts holds the executor options; New reads its Options field for
// verbosity and for obtaining the HTTP client.
ExecuterOpts protocols.ExecutorOptions
// Store is the template loader store; New stores it on the Service.
Store *loader.Store
// Engine is the core engine; New calls its ChildExecuter method.
Engine *core.Engine
// Target is the input provider whose targets Service.Execute iterates over.
Target provider.InputProvider
}
// Service is a service for automatic scan execution.
// Instances are created with New.
type Service struct {
// opts is a copy of Options.ExecuterOpts (concurrency settings, user tags,
// output, progress and issue client are read from it).
opts protocols.ExecutorOptions
// store is taken from Options.Store.
store *loader.Store
// engine is taken from Options.Engine.
engine *core.Engine
// target provides the inputs that Execute iterates over.
target provider.InputProvider
// wappalyzer fingerprints response headers and bodies.
wappalyzer *wappalyzer.Wappalyze
// childExecuter is obtained from Options.Engine.ChildExecuter() in New.
childExecuter *core.ChildExecuter
// httpclient is used to fetch a target before fingerprinting it.
httpclient *retryablehttp.Client
templateDirs []string // root Template Directories
// technologyMappings maps a normalized technology name to its replacement
// value; it is decoded from the wappalyzer mapping file and may be nil.
technologyMappings map[string]string
// techTemplates are the templates loaded in New with the tags
// "tech", "detect" and "favicon".
techTemplates []*templates.Template
// ServiceOpts is the Options value that was passed to New.
ServiceOpts Options
// hasResults records whether any result was found; Close returns its value.
hasResults *atomic.Bool
}
// New builds an automatic scan Service from the given options.
//
// In order, it creates the wappalyzer fingerprinting client, reads the
// optional technology mapping file from the default template directory,
// resolves the template directories, loads the technology detection
// templates and obtains an HTTP client from the client pool. Any failure
// other than reading the mapping file is returned as an error.
func New(opts Options) (*Service, error) {
	fingerprinter, err := wappalyzer.New()
	if err != nil {
		return nil, err
	}

	// The extra mapping from nuclei-templates is used for normalization and is
	// optional: if the file cannot be opened or decoded the error is ignored
	// on purpose and whatever was decoded (possibly nothing) is used.
	var technologyMappings map[string]string
	mappingPath := filepath.Join(config.DefaultConfig.GetTemplateDir(), mappingFilename)
	if mappingFile, openErr := os.Open(mappingPath); openErr == nil {
		_ = yaml.NewDecoder(mappingFile).Decode(&technologyMappings)
		mappingFile.Close()
	}
	if opts.ExecuterOpts.Options.Verbose {
		gologger.Verbose().Msgf("Normalized mapping (%d): %v\n", len(technologyMappings), technologyMappings)
	}

	// resolve the root template directories
	rootDirs, err := getTemplateDirs(opts)
	if err != nil {
		return nil, err
	}

	// preload the technology detection templates
	detectionTemplates, err := LoadTemplatesWithTags(opts, rootDirs, []string{"tech", "detect", "favicon"}, true)
	if err != nil {
		return nil, err
	}

	executer := opts.Engine.ChildExecuter()

	clientConfig := &httpclientpool.Configuration{
		Connection: &httpclientpool.ConnectionConfiguration{
			DisableKeepAlive: httputil.ShouldDisableKeepAlive(opts.ExecuterOpts.Options),
		},
	}
	client, err := httpclientpool.Get(opts.ExecuterOpts.Options, clientConfig)
	if err != nil {
		return nil, errors.Wrap(err, "could not get http client")
	}

	service := &Service{
		opts:               opts.ExecuterOpts,
		store:              opts.Store,
		engine:             opts.Engine,
		target:             opts.Target,
		wappalyzer:         fingerprinter,
		templateDirs:       rootDirs, // fix this
		childExecuter:      executer,
		httpclient:         client,
		technologyMappings: technologyMappings,
		techTemplates:      detectionTemplates,
		ServiceOpts:        opts,
		hasResults:         &atomic.Bool{},
	}
	return service, nil
}
// Close reports whether the service has recorded any results so far.
// It only reads the hasResults flag and does not release any resources.
func (s *Service) Close() bool {
	foundResults := s.hasResults.Load()
	return foundResults
}
// Execute runs the automatic scan on every target of the input provider.
// Each target is scanned in its own goroutine, with host concurrency limited
// by the bulk size (-bs) option. It waits for all targets to finish and
// always returns nil.
func (s *Service) Execute() error {
	gologger.Info().Msgf("Executing Automatic scan on %d target[s]", s.target.Count())

	// host concurrency limiter
	hostPool := sizedwaitgroup.New(s.opts.Options.BulkSize)
	scanTarget := func(input *contextargs.MetaInput) {
		defer hostPool.Done()
		s.executeAutomaticScanOnTarget(input)
	}

	s.target.Iterate(func(value *contextargs.MetaInput) bool {
		hostPool.Add()
		go scanTarget(value)
		// keep iterating over the remaining targets
		return true
	})

	hostPool.Wait()
	return nil
}
// executeAutomaticScanOnTarget executes automatic scan on given target.
//
// It collects technology tags from wappalyzer fingerprinting and from the
// detection templates, merges them with the user supplied tags, loads the
// templates matching those tags and runs them against the target with a
// fresh engine. The service's hasResults flag is raised when either the
// detection templates or the final scan produced a match; it is never
// lowered here, because this method runs concurrently for several targets
// and a target without findings must not hide the findings of another one.
func (s *Service) executeAutomaticScanOnTarget(input *contextargs.MetaInput) {
	// get tags using wappalyzer
	tagsFromWappalyzer := s.getTagsUsingWappalyzer(input)
	// get tags using detection templates
	tagsFromDetectTemplates, matched := s.getTagsUsingDetectionTemplates(input)
	if matched > 0 {
		s.hasResults.Store(true)
	}

	// create combined final tags; both sources are walked separately instead
	// of appending one onto the other so neither input slice is written to
	finalTags := make([]string, 0, len(tagsFromWappalyzer)+len(tagsFromDetectTemplates))
	for _, source := range [][]string{tagsFromWappalyzer, tagsFromDetectTemplates} {
		for _, tag := range source {
			// generic category tags do not identify a technology
			if stringsutil.EqualFoldAny(tag, "tech", "waf", "favicon") {
				continue
			}
			finalTags = append(finalTags, tag)
		}
	}
	finalTags = sliceutil.Dedupe(finalTags)
	gologger.Info().Msgf("Found %d tags and %d matches on detection templates on %v [wappalyzer: %d, detection: %d]\n", len(finalTags), matched, input.Input, len(tagsFromWappalyzer), len(tagsFromDetectTemplates))

	// also include any extra tags passed by user
	finalTags = append(finalTags, s.opts.Options.Tags...)
	finalTags = sliceutil.Dedupe(finalTags)
	if len(finalTags) == 0 {
		gologger.Warning().Msgf("Skipping automatic scan since no tags were found on %v\n", input.Input)
		return
	}
	if s.opts.Options.VerboseVerbose {
		gologger.Print().Msgf("Final tags identified for %v: %+v\n", input.Input, finalTags)
	}

	finalTemplates, err := LoadTemplatesWithTags(s.ServiceOpts, s.templateDirs, finalTags, false)
	if err != nil {
		gologger.Error().Msgf("%v Error loading templates: %s\n", input.Input, err)
		return
	}
	gologger.Info().Msgf("Executing %d templates on %v", len(finalTemplates), input.Input)

	eng := core.New(s.opts.Options)
	execOptions := s.opts.Copy()
	execOptions.Progress = &testutils.MockProgressClient{} // stats are not supported yet due to centralized logic and cannot be reinitialized
	eng.SetExecuterOptions(execOptions)

	scanResults := eng.ExecuteScanWithOpts(finalTemplates, provider.NewSimpleInputProviderWithUrls(input.Input), true)
	// Only ever raise the flag: storing the raw value would reset a "true"
	// set above by the detection phase or by another target's goroutine.
	if scanResults.Load() {
		s.hasResults.Store(true)
	}
}
// getTagsUsingWappalyzer returns tags using wappalyzer by fingerprinting target
// and utilizing the mapping data.
//
// The target is fetched with a GET request using a random user agent and at
// most maxDefaultBody bytes of the body are read. Fingerprinted application
// names are normalized, replaced through technologyMappings where an entry
// exists, lowercased and split on whitespace into individual tags. The
// returned slice is deduplicated; its order is not defined. nil is returned
// when the request cannot be built, sent or read.
func (s *Service) getTagsUsingWappalyzer(input *contextargs.MetaInput) []string {
	req, err := retryablehttp.NewRequest(http.MethodGet, input.Input, nil)
	if err != nil {
		return nil
	}
	userAgent := useragent.PickRandom()
	req.Header.Set("User-Agent", userAgent.Raw)

	resp, err := s.httpclient.Do(req)
	if err != nil {
		return nil
	}
	defer resp.Body.Close()

	data, err := io.ReadAll(io.LimitReader(resp.Body, maxDefaultBody))
	if err != nil {
		return nil
	}

	// fingerprint headers and body
	fingerprints := s.wappalyzer.Fingerprint(resp.Header, data)
	normalized := make(map[string]struct{}, len(fingerprints))
	for name := range fingerprints {
		normalized[normalizeAppName(name)] = struct{}{}
	}
	gologger.Verbose().Msgf("Found %d fingerprints for %s\n", len(normalized), input.Input)

	// Replace names with their mapping data. The result goes into a separate
	// map: inserting into a map while ranging over it may or may not visit the
	// new entry, which made chained mappings resolve nondeterministically.
	// Every fingerprint is now mapped exactly once.
	mapped := make(map[string]struct{}, len(normalized))
	for name := range normalized {
		if value, ok := s.technologyMappings[name]; ok {
			name = value
		}
		mapped[name] = struct{}{}
	}

	// more post processing: multi-word names become one tag per word.
	// strings.Fields drops empty words, so empty names or repeated spaces
	// never produce an empty tag.
	items := make([]string, 0, len(mapped))
	for name := range mapped {
		items = append(items, strings.Fields(strings.ToLower(name))...)
	}
	return sliceutil.Dedupe(items)
}
// getTagsUsingDetectionTemplates runs the preloaded technology detection
// templates against the target and derives tags from the matches.
//
// Templates are executed concurrently, limited by the template threads
// option. It returns the collected tags (in no particular order) together
// with the number of result events that carried an operator result.
func (s *Service) getTagsUsingDetectionTemplates(input *contextargs.MetaInput) ([]string, int) {
	ctxArgs := contextargs.NewWithInput(input.Input)

	var (
		tagsMu     sync.Mutex    // guards detected
		matchCount atomic.Uint32 // number of events with an operator result
	)
	detected := make(map[string]struct{})
	pool := sizedwaitgroup.New(s.opts.Options.TemplateThreads)

	// execute tech detection templates on target
	for _, techTemplate := range s.techTemplates {
		pool.Add()
		go func(template *templates.Template) {
			defer pool.Done()

			scanCtx := scan.NewScanContext(ctxArgs)
			scanCtx.OnResult = func(event *output.InternalWrappedEvent) {
				// only events that actually matched are of interest
				if event == nil || !event.HasOperatorResult() {
					return
				}

				// collect unique tags from the match
				tagsMu.Lock()
				for _, result := range event.Results {
					if result.MatcherName != "" {
						detected[result.MatcherName] = struct{}{}
					}
					for _, tag := range result.Info.Tags.ToSlice() {
						// Template tags also contain protocol type tags and are not
						// limited to products or technologies
						// (ex: tags: js,mssql,detect,network), so a tag is only kept
						// when it also appears in the template id or template name.
						relevant := strings.Contains(template.ID, tag) ||
							strings.Contains(strings.ToLower(template.Info.Name), tag)
						if !relevant {
							continue
						}
						detected[tag] = struct{}{}
						// matcher names are also relevant in tech detection templates (ex: tech-detect)
						for matcherName := range event.OperatorsResult.Matches {
							detected[matcherName] = struct{}{}
						}
					}
				}
				tagsMu.Unlock()

				matchCount.Add(1)
				// TBD: should we show or hide tech detection results? what about matcher-status flag?
				_ = writer.WriteResult(event, s.opts.Output, s.opts.Progress, s.opts.IssuesClient)
			}

			if _, err := template.Executer.ExecuteWithResults(scanCtx); err != nil {
				gologger.Verbose().Msgf("[%s] error executing template: %s\n", aurora.BrightYellow(template.ID), err)
			}
		}(techTemplate)
	}
	pool.Wait()

	return mapsutil.GetKeys(detected), int(matchCount.Load())
}
// normalizeAppName returns the lowercased application name.
// When the name contains exactly one ":" everything from the colon onwards
// is dropped first; names with no colon or with several colons are only
// lowercased.
func normalizeAppName(appName string) string {
	if strings.Count(appName, ":") == 1 {
		appName, _, _ = strings.Cut(appName, ":")
	}
	return strings.ToLower(appName)
}