crawler

package
v0.6.0 Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Apr 14, 2026 License: MIT Imports: 31 Imported by: 0

Documentation

Index

Constants

This section is empty.

Variables

This section is empty.

Functions

This section is empty.

Types

type CrawlOptions

// CrawlOptions is the options struct accepted by the package-level Crawl
// function and by the Crawl method of the Source interface.
//
// NOTE(review): only field names and types are visible in this listing. The
// per-field notes below are inferred from those names and must be confirmed
// against the implementation before being relied on.
type CrawlOptions struct {
	// presumably the URL the crawl starts from — confirm
	URL               string
	// presumably a limit on link-following depth — confirm units and zero-value meaning
	Depth             int
	UserAgent         string
	Verbose           bool
	Offsite           bool
	WithNumbers       bool
	// The Extract*/Capture* booleans appear to toggle individual kinds of
	// output; which CrawlResult field each one feeds is not shown here.
	ExtractEmails     bool
	ExtractMeta       bool
	CapturePaths      bool
	CaptureSubdomains bool
	CaptureDomain     bool
	// MaxPages, Threads, MaxContext and MaxFiles are plain ints; presumably
	// upper bounds — TODO confirm what 0 or a negative value means for each.
	MaxPages          int
	Threads           int
	MaxContext        int
	NoCache           bool
	// CacheTTL is a time.Duration; presumably the lifetime of cached
	// entries when NoCache is false — confirm.
	CacheTTL          time.Duration
	MaxFiles          int
	ExtractSecrets    bool
	ProxyURL          string
	// AuthType, AuthUser and AuthPass are free-form strings; the accepted
	// AuthType values are not visible here.
	AuthType          string
	AuthUser          string
	AuthPass          string
	// Headers and ExcludePaths are string slices; the expected entry format
	// (e.g. "Name: value", glob vs. prefix) is not visible here — confirm.
	Headers           []string
	ExcludePaths      []string
	DumpDir           string
}

type CrawlResult

// CrawlResult is the value returned, by pointer, from the package-level Crawl
// function and from the Crawl method of the Source interface.
//
// NOTE(review): only field names and types are visible in this listing; how
// each field is populated (ordering, de-duplication, which CrawlOptions flag
// enables it) must be confirmed against the implementation.
type CrawlResult struct {
	Words    []string
	Emails   []string
	Metadata []string
	Secrets  []string
	// Context is a single string, unlike the slice fields above; its exact
	// contents are not visible here.
	Context  string
	URL      string
	Title    string
	// Pages is an int; presumably a count of pages processed — confirm.
	Pages    int
}

func Crawl

// Crawl takes a context and a CrawlOptions value and returns a *CrawlResult
// together with an error.
//
// NOTE(review): the function body is not shown in this listing; how ctx is
// honored and which errors can be returned should be confirmed in the source.
func Crawl(ctx context.Context, opts CrawlOptions) (*CrawlResult, error)

type Source added in v0.4.0

// Source is a single-method interface whose Crawl method has the same
// parameters and results as the package-level Crawl function. Values of this
// type are returned by NewSource.
type Source interface {
	// Crawl takes a context and a CrawlOptions value and returns a
	// *CrawlResult together with an error.
	Crawl(ctx context.Context, opts CrawlOptions) (*CrawlResult, error)
}

func NewSource added in v0.4.0

// NewSource takes a target URL string and returns a Source together with an
// error.
//
// NOTE(review): the function body is not shown in this listing; how targetURL
// determines the returned Source, and when an error is returned, should be
// confirmed in the source.
func NewSource(targetURL string) (Source, error)

Directories

Path Synopsis

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL