Documentation
¶
Index ¶
Constants ¶
This section is empty.
Variables ¶
This section is empty.
Functions ¶
This section is empty.
Types ¶
type BrowserConfig ¶
// BrowserConfig groups the browser-related settings, read from the TOML keys
// "default", "paths" and "cookies".
//
// NOTE(review): unlike the fields of Config, these fields carry only toml
// tags (no mapstructure tags) — confirm the decoder in use honours toml tags.
type BrowserConfig struct {
// Default is read from the "default" key; presumably the name of the
// browser to use when none is specified — TODO confirm against the loader.
Default string `toml:"default"`
// Paths is a string-to-string map read from the "paths" key; presumably
// browser name -> executable path — verify against the caller.
Paths map[string]string `toml:"paths"`
// Cookies holds the nested "cookies" table, typed as BrowserCookiesConfig.
Cookies BrowserCookiesConfig `toml:"cookies"`
}
type BrowserCookiesConfig ¶
type Config ¶
// Config is the top-level configuration structure. Every field carries both a
// toml tag and a mapstructure tag naming the same key, and all fields except
// Schema hold a nested per-area configuration struct.
type Config struct {
// Schema is stored under the "$schema" key; the toml tag sets omitempty.
// Presumably a reference to a schema describing the config file — TODO confirm.
Schema string `toml:"$schema,omitempty" mapstructure:"$schema"`
// Browser is the "browser" section.
Browser BrowserConfig `toml:"browser" mapstructure:"browser"`
// Extraction is the "extraction" section.
Extraction ExtractionConfig `toml:"extraction" mapstructure:"extraction"`
// Output is the "output" section.
Output OutputConfig `toml:"output" mapstructure:"output"`
// Network is the "network" section.
Network NetworkConfig `toml:"network" mapstructure:"network"`
// Parallel is the "parallel" section.
Parallel ParallelConfig `toml:"parallel" mapstructure:"parallel"`
// Pipe is the "pipe" section.
Pipe PipeConfig `toml:"pipe" mapstructure:"pipe"`
// Logging is the "logging" section.
Logging LoggingConfig `toml:"logging" mapstructure:"logging"`
}
func (*Config) CreateExampleConfig ¶
type ExtractionConfig ¶
// ExtractionConfig holds the content-extraction settings: cookie-banner
// handling, JavaScript options, content clean-up flags, the backend selector,
// and the nested settings for the Tavily and Jina backends.
//
// NOTE(review): fields carry only toml tags (no mapstructure tags, unlike
// Config) — confirm the decoder in use honours toml tags for snake_case keys.
type ExtractionConfig struct {
// SkipCookieBanners is read from "skip_cookie_banners".
SkipCookieBanners bool `toml:"skip_cookie_banners"`
// BannerTimeout is read from "banner_timeout"; the unit is not visible
// here — TODO confirm (seconds vs. milliseconds).
BannerTimeout int `toml:"banner_timeout"`
// EnableJavaScript is read from "enable_javascript".
// NOTE(review): this is a string, not a bool — the accepted values are not
// visible here; verify against the code that consumes it.
EnableJavaScript string `toml:"enable_javascript"`
// JSTimeout is read from "js_timeout"; unit not visible here — TODO confirm.
JSTimeout int `toml:"js_timeout"`
// WaitForSelector is read from "wait_for_selector"; presumably a CSS
// selector to wait for before extracting — TODO confirm.
WaitForSelector string `toml:"wait_for_selector"`
// MinContentLength is read from "min_content_length"; whether it counts
// bytes or characters is not visible here.
MinContentLength int `toml:"min_content_length"`
// RemoveAds is read from "remove_ads".
RemoveAds bool `toml:"remove_ads"`
// CleanHTML is read from "clean_html".
CleanHTML bool `toml:"clean_html"`
// Backend selects the extraction backend by name.
Backend string `toml:"backend"` // readability (default), tavily, jina
// Tavily extraction settings
Tavily TavilyExtractionConfig `toml:"tavily"`
// Jina extraction settings
Jina JinaExtractionConfig `toml:"jina"`
}
type JinaExtractionConfig ¶
// JinaExtractionConfig holds Jina Reader API settings.
type JinaExtractionConfig struct {
// APIKey is read from the "api_key" key.
APIKey string `toml:"api_key"` // optional, for higher rate limits
}
JinaExtractionConfig holds Jina Reader API settings.
type LoggingConfig ¶
type NetworkConfig ¶
type OutputConfig ¶
type ParallelConfig ¶
type PipeConfig ¶
type TavilyExtractionConfig ¶
// TavilyExtractionConfig holds Tavily Extract API settings.
type TavilyExtractionConfig struct {
// APIKey is read from the "api_key" key.
APIKey string `toml:"api_key"`
// ExtractDepth is read from the "extract_depth" key.
ExtractDepth string `toml:"extract_depth"` // basic or advanced
}
TavilyExtractionConfig holds Tavily Extract API settings.
Click to show internal directories.
Click to hide internal directories.