Documentation
¶
Index ¶
Constants ¶
This section is empty.
Variables ¶
This section is empty.
Functions ¶
This section is empty.
Types ¶
type DefaultExtractor ¶
type DefaultExtractor struct {
HTTPClient httputils.HTTPClient
Filters htmlselector.OptimizedFilterGroup
LinkTransformer models.LinkTransformer
}
DefaultExtractor ...
func (DefaultExtractor) ExtractLinks ¶
func (extractor DefaultExtractor) ExtractLinks( ctx context.Context, threadID int, link string, ) ([]string, error)
ExtractLinks ...
type DelayingExtractor ¶
type DelayingExtractor struct {
// contains filtered or unexported fields
}
DelayingExtractor ...
func NewDelayingExtractor ¶
func NewDelayingExtractor( minimalDelay time.Duration, sleeper SleepHandler, linkExtractor models.LinkExtractor, ) *DelayingExtractor
NewDelayingExtractor ...
func (*DelayingExtractor) ExtractLinks ¶
func (extractor *DelayingExtractor) ExtractLinks( ctx context.Context, threadID int, link string, ) ([]string, error)
ExtractLinks ...
type ExtractorGroup ¶ added in v1.7.1
type ExtractorGroup struct {
Name string
LinkExtractors []models.LinkExtractor
Logger log.Logger
}
ExtractorGroup ...
func (ExtractorGroup) ExtractLinks ¶ added in v1.7.1
func (extractors ExtractorGroup) ExtractLinks( ctx context.Context, threadID int, link string, ) ([]string, error)
ExtractLinks ...
type HTTPClient ¶
type HTTPClient interface {
httputils.HTTPClient
}
HTTPClient ...
It's used only for mock generating.
type LinkExtractor ¶
type LinkExtractor interface {
models.LinkExtractor
}
LinkExtractor ...
It's used only for mock generating.
type LinkTransformer ¶ added in v1.11.1
type LinkTransformer interface {
models.LinkTransformer
}
LinkTransformer ...
It's used only for mock generating.
type RepeatingExtractor ¶
type RepeatingExtractor struct {
LinkExtractor models.LinkExtractor
RepeatCount int
RepeatDelay time.Duration
Logger log.Logger
SleepHandler SleepHandler
}
RepeatingExtractor ...
func (RepeatingExtractor) ExtractLinks ¶
func (extractor RepeatingExtractor) ExtractLinks( ctx context.Context, threadID int, link string, ) ([]string, error)
ExtractLinks ...
type SitemapExtractor ¶ added in v1.7.1
type SitemapExtractor struct {
SitemapRegister registers.SitemapRegister
Logger log.Logger
}
SitemapExtractor ...
func (SitemapExtractor) ExtractLinks ¶ added in v1.7.1
func (extractor SitemapExtractor) ExtractLinks( ctx context.Context, threadID int, link string, ) ([]string, error)
ExtractLinks ...
type TrimmingExtractor ¶ added in v1.10.1
type TrimmingExtractor struct {
TrimLink urlutils.LinkTrimming
LinkExtractor models.LinkExtractor
}
TrimmingExtractor ...
func (TrimmingExtractor) ExtractLinks ¶ added in v1.10.1
func (extractor TrimmingExtractor) ExtractLinks( ctx context.Context, threadID int, link string, ) ([]string, error)
ExtractLinks ...
Source Files
¶
Click to show internal directories.
Click to hide internal directories.