mirror of
https://github.com/projectdiscovery/nuclei.git
synced 2025-12-17 18:05:27 +00:00
* spelling: addresses Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: asynchronous Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: basic Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: brute force Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: constant Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: disables Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: engine Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: every time Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: execution Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: false positives Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: from Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: further Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: github Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: gitlab Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: highlight Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: hygiene Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: ignore Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: input Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: item Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: itself Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: latestxxx Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: navigation Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: negative Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: nonexistent Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: occurred Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: override Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: overrides Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: payload Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: performed Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: respective Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: retrieve Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: scanlist Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: separated Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: separator Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: severity Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: source Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: strategy Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: string Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: templates Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: terminal Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: timeout Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: trailing slash Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: trailing Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> * spelling: websocket Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com> --------- Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com>
349 lines
9.3 KiB
Go
349 lines
9.3 KiB
Go
// Package hybrid implements a hybrid hmap/filekv backed input provider
|
|
// for nuclei that can either stream or store results using different kv stores.
|
|
package hybrid
|
|
|
|
import (
|
|
"bufio"
|
|
"context"
|
|
"fmt"
|
|
"io"
|
|
"os"
|
|
"strings"
|
|
"sync"
|
|
"time"
|
|
|
|
"github.com/pkg/errors"
|
|
|
|
"github.com/projectdiscovery/gologger"
|
|
"github.com/projectdiscovery/hmap/filekv"
|
|
"github.com/projectdiscovery/hmap/store/hybrid"
|
|
"github.com/projectdiscovery/mapcidr"
|
|
"github.com/projectdiscovery/mapcidr/asn"
|
|
"github.com/projectdiscovery/nuclei/v2/pkg/protocols/common/contextargs"
|
|
"github.com/projectdiscovery/nuclei/v2/pkg/protocols/common/protocolstate"
|
|
"github.com/projectdiscovery/nuclei/v2/pkg/protocols/common/uncover"
|
|
"github.com/projectdiscovery/nuclei/v2/pkg/types"
|
|
uncoverlib "github.com/projectdiscovery/uncover"
|
|
fileutil "github.com/projectdiscovery/utils/file"
|
|
iputil "github.com/projectdiscovery/utils/ip"
|
|
readerutil "github.com/projectdiscovery/utils/reader"
|
|
sliceutil "github.com/projectdiscovery/utils/slice"
|
|
urlutil "github.com/projectdiscovery/utils/url"
|
|
)
|
|
|
|
const DefaultMaxDedupeItemsCount = 10000
|
|
|
|
// Input is a hmap/filekv backed nuclei Input provider
|
|
type Input struct {
|
|
ipOptions *ipOptions
|
|
inputCount int64
|
|
dupeCount int64
|
|
hostMap *hybrid.HybridMap
|
|
hostMapStream *filekv.FileDB
|
|
hostMapStreamOnce sync.Once
|
|
sync.Once
|
|
}
|
|
|
|
// Options is a wrapper around types.Options structure
|
|
type Options struct {
|
|
// Options contains options for hmap provider
|
|
Options *types.Options
|
|
// NotFoundCallback is called for each not found target
|
|
// This overrides error handling for not found target
|
|
NotFoundCallback func(template string) bool
|
|
}
|
|
|
|
// New creates a new hmap backed nuclei Input Provider
|
|
// and initializes it based on the passed options Model.
|
|
func New(opts *Options) (*Input, error) {
|
|
options := opts.Options
|
|
|
|
hm, err := hybrid.New(hybrid.DefaultDiskOptions)
|
|
if err != nil {
|
|
return nil, errors.Wrap(err, "could not create temporary input file")
|
|
}
|
|
|
|
input := &Input{
|
|
hostMap: hm,
|
|
ipOptions: &ipOptions{
|
|
ScanAllIPs: options.ScanAllIPs,
|
|
IPV4: sliceutil.Contains(options.IPVersion, "4"),
|
|
IPV6: sliceutil.Contains(options.IPVersion, "6"),
|
|
},
|
|
}
|
|
if options.Stream {
|
|
fkvOptions := filekv.DefaultOptions
|
|
fkvOptions.MaxItems = DefaultMaxDedupeItemsCount
|
|
if tmpFileName, err := fileutil.GetTempFileName(); err != nil {
|
|
return nil, errors.Wrap(err, "could not create temporary input file")
|
|
} else {
|
|
fkvOptions.Path = tmpFileName
|
|
}
|
|
fkv, err := filekv.Open(fkvOptions)
|
|
if err != nil {
|
|
return nil, errors.Wrap(err, "could not create temporary unsorted input file")
|
|
}
|
|
input.hostMapStream = fkv
|
|
}
|
|
if initErr := input.initializeInputSources(opts); initErr != nil {
|
|
return nil, initErr
|
|
}
|
|
if input.dupeCount > 0 {
|
|
gologger.Info().Msgf("Supplied input was automatically deduplicated (%d removed).", input.dupeCount)
|
|
}
|
|
return input, nil
|
|
}
|
|
|
|
// Close closes the input provider
|
|
func (i *Input) Close() {
|
|
i.hostMap.Close()
|
|
if i.hostMapStream != nil {
|
|
i.hostMapStream.Close()
|
|
}
|
|
}
|
|
|
|
// initializeInputSources initializes the input sources for hmap input
|
|
func (i *Input) initializeInputSources(opts *Options) error {
|
|
options := opts.Options
|
|
|
|
// Handle targets flags
|
|
for _, target := range options.Targets {
|
|
switch {
|
|
case iputil.IsCIDR(target):
|
|
i.expandCIDRInputValue(target)
|
|
case asn.IsASN(target):
|
|
i.expandASNInputValue(target)
|
|
default:
|
|
i.Set(target)
|
|
}
|
|
}
|
|
|
|
// Handle stdin
|
|
if options.Stdin {
|
|
i.scanInputFromReader(readerutil.TimeoutReader{Reader: os.Stdin, Timeout: time.Duration(options.InputReadTimeout)})
|
|
}
|
|
|
|
// Handle target file
|
|
if options.TargetsFilePath != "" {
|
|
input, inputErr := os.Open(options.TargetsFilePath)
|
|
if inputErr != nil {
|
|
// Handle cloud based input here.
|
|
if opts.NotFoundCallback == nil || !opts.NotFoundCallback(options.TargetsFilePath) {
|
|
return errors.Wrap(inputErr, "could not open targets file")
|
|
}
|
|
}
|
|
if input != nil {
|
|
i.scanInputFromReader(input)
|
|
input.Close()
|
|
}
|
|
}
|
|
if options.Uncover && options.UncoverQuery != nil {
|
|
gologger.Info().Msgf("Running uncover query against: %s", strings.Join(options.UncoverEngine, ","))
|
|
uncoverOpts := &uncoverlib.Options{
|
|
Agents: options.UncoverEngine,
|
|
Queries: options.UncoverQuery,
|
|
Limit: options.UncoverLimit,
|
|
MaxRetry: options.Retries,
|
|
Timeout: options.Timeout,
|
|
RateLimit: uint(options.UncoverRateLimit),
|
|
RateLimitUnit: time.Minute, // default unit is minute
|
|
}
|
|
ch, err := uncover.GetTargetsFromUncover(context.TODO(), options.UncoverField, uncoverOpts)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
for c := range ch {
|
|
i.Set(c)
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// scanInputFromReader scans a line of input from reader and passes it for storage
|
|
func (i *Input) scanInputFromReader(reader io.Reader) {
|
|
scanner := bufio.NewScanner(reader)
|
|
for scanner.Scan() {
|
|
item := scanner.Text()
|
|
switch {
|
|
case iputil.IsCIDR(item):
|
|
i.expandCIDRInputValue(item)
|
|
case asn.IsASN(item):
|
|
i.expandASNInputValue(item)
|
|
default:
|
|
i.Set(item)
|
|
}
|
|
}
|
|
}
|
|
|
|
// Set normalizes and stores passed input values
|
|
func (i *Input) Set(value string) {
|
|
URL := strings.TrimSpace(value)
|
|
if URL == "" {
|
|
return
|
|
}
|
|
// parse hostname if url is given
|
|
urlx, err := urlutil.Parse(URL)
|
|
if err != nil || (urlx != nil && urlx.Host == "") {
|
|
gologger.Debug().Label("url").MsgFunc(func() string {
|
|
if err != nil {
|
|
return fmt.Sprintf("failed to parse url %v got %v skipping ip selection", URL, err)
|
|
}
|
|
return fmt.Sprintf("got empty hostname for %v skipping ip selection", URL)
|
|
})
|
|
metaInput := &contextargs.MetaInput{Input: URL}
|
|
i.setItem(metaInput)
|
|
return
|
|
}
|
|
|
|
// Check if input is ip or hostname
|
|
if iputil.IsIP(urlx.Hostname()) {
|
|
metaInput := &contextargs.MetaInput{Input: URL}
|
|
i.setItem(metaInput)
|
|
return
|
|
}
|
|
|
|
if i.ipOptions.ScanAllIPs {
|
|
// scan all ips
|
|
dnsData, err := protocolstate.Dialer.GetDNSData(urlx.Hostname())
|
|
if err == nil {
|
|
if (len(dnsData.A) + len(dnsData.AAAA)) > 0 {
|
|
var ips []string
|
|
if i.ipOptions.IPV4 {
|
|
ips = append(ips, dnsData.A...)
|
|
}
|
|
if i.ipOptions.IPV6 {
|
|
ips = append(ips, dnsData.AAAA...)
|
|
}
|
|
for _, ip := range ips {
|
|
if ip == "" {
|
|
continue
|
|
}
|
|
metaInput := &contextargs.MetaInput{Input: value, CustomIP: ip}
|
|
i.setItem(metaInput)
|
|
}
|
|
return
|
|
} else {
|
|
gologger.Debug().Msgf("scanAllIps: no ip's found reverting to default")
|
|
}
|
|
} else {
|
|
// failed to scanallips falling back to defaults
|
|
gologger.Debug().Msgf("scanAllIps: dns resolution failed: %v", err)
|
|
}
|
|
}
|
|
|
|
ips := []string{}
|
|
// only scan the target but ipv6 if it has one
|
|
if i.ipOptions.IPV6 {
|
|
dnsData, err := protocolstate.Dialer.GetDNSData(urlx.Hostname())
|
|
if err == nil && len(dnsData.AAAA) > 0 {
|
|
// pick/ prefer 1st
|
|
ips = append(ips, dnsData.AAAA[0])
|
|
} else {
|
|
gologger.Warning().Msgf("target does not have ipv6 address falling back to ipv4 %v\n", err)
|
|
}
|
|
}
|
|
if i.ipOptions.IPV4 {
|
|
// if IPV4 is enabled do not specify ip let dialer handle it
|
|
ips = append(ips, "")
|
|
}
|
|
|
|
for _, ip := range ips {
|
|
if ip != "" {
|
|
metaInput := &contextargs.MetaInput{Input: URL, CustomIP: ip}
|
|
i.setItem(metaInput)
|
|
} else {
|
|
metaInput := &contextargs.MetaInput{Input: URL}
|
|
i.setItem(metaInput)
|
|
}
|
|
}
|
|
}
|
|
|
|
// setItem in the kv store
|
|
func (i *Input) setItem(metaInput *contextargs.MetaInput) {
|
|
key, err := metaInput.MarshalString()
|
|
if err != nil {
|
|
gologger.Warning().Msgf("%s\n", err)
|
|
return
|
|
}
|
|
if _, ok := i.hostMap.Get(key); ok {
|
|
i.dupeCount++
|
|
return
|
|
}
|
|
|
|
i.inputCount++ // tracks target count
|
|
_ = i.hostMap.Set(key, nil)
|
|
if i.hostMapStream != nil {
|
|
i.setHostMapStream(key)
|
|
}
|
|
}
|
|
|
|
// setHostMapStream sets item in stream mode
|
|
func (i *Input) setHostMapStream(data string) {
|
|
if _, err := i.hostMapStream.Merge([][]byte{[]byte(data)}); err != nil {
|
|
gologger.Warning().Msgf("%s\n", err)
|
|
return
|
|
}
|
|
}
|
|
|
|
// Count returns the input count
|
|
func (i *Input) Count() int64 {
|
|
return i.inputCount
|
|
}
|
|
|
|
// Scan iterates the input and each found item is passed to the
|
|
// callback consumer.
|
|
func (i *Input) Scan(callback func(value *contextargs.MetaInput) bool) {
|
|
if i.hostMapStream != nil {
|
|
i.hostMapStreamOnce.Do(func() {
|
|
if err := i.hostMapStream.Process(); err != nil {
|
|
gologger.Warning().Msgf("error in stream mode processing: %s\n", err)
|
|
}
|
|
})
|
|
}
|
|
callbackFunc := func(k, _ []byte) error {
|
|
metaInput := &contextargs.MetaInput{}
|
|
if err := metaInput.Unmarshal(string(k)); err != nil {
|
|
return err
|
|
}
|
|
if !callback(metaInput) {
|
|
return io.EOF
|
|
}
|
|
return nil
|
|
}
|
|
if i.hostMapStream != nil {
|
|
_ = i.hostMapStream.Scan(callbackFunc)
|
|
} else {
|
|
i.hostMap.Scan(callbackFunc)
|
|
}
|
|
}
|
|
|
|
// expandCIDRInputValue expands CIDR and stores expanded IPs
|
|
func (i *Input) expandCIDRInputValue(value string) {
|
|
ips, _ := mapcidr.IPAddressesAsStream(value)
|
|
for ip := range ips {
|
|
metaInput := &contextargs.MetaInput{Input: ip}
|
|
key, err := metaInput.MarshalString()
|
|
if err != nil {
|
|
gologger.Warning().Msgf("%s\n", err)
|
|
return
|
|
}
|
|
if _, ok := i.hostMap.Get(key); ok {
|
|
i.dupeCount++
|
|
continue
|
|
}
|
|
i.inputCount++
|
|
_ = i.hostMap.Set(key, nil)
|
|
if i.hostMapStream != nil {
|
|
i.setHostMapStream(key)
|
|
}
|
|
}
|
|
}
|
|
|
|
// expandASNInputValue expands CIDRs for given ASN and stores expanded IPs
|
|
func (i *Input) expandASNInputValue(value string) {
|
|
cidrs, _ := asn.GetCIDRsForASNNum(value)
|
|
for _, cidr := range cidrs {
|
|
i.expandCIDRInputValue(cidr.String())
|
|
}
|
|
}
|