Documentation ¶
Index ¶
- type ContentProcessor
- func NewContentProcessor() *ContentProcessor
- func (cp *ContentProcessor) CleanNewlines(text string) string
- func (cp *ContentProcessor) Process(html, url string, opts ProcessOptions) (*ProcessedContent, error)
- func (cp *ContentProcessor) ProcessFromReader(r io.Reader, url string, opts ProcessOptions) (*ProcessedContent, error)
- func (cp *ContentProcessor) ToMarkdown(content *ProcessedContent, includeMetadata bool, preserveLinks bool) string
- func (cp *ContentProcessor) ToText(content *ProcessedContent, lineWidth int) string
- type Link
- type ProcessOptions
- type ProcessedContent
Constants ¶
This section is empty.
Variables ¶
This section is empty.
Functions ¶
This section is empty.
Types ¶
type ContentProcessor ¶
type ContentProcessor struct {
}
func NewContentProcessor ¶
func NewContentProcessor() *ContentProcessor
func (*ContentProcessor) CleanNewlines ¶
func (cp *ContentProcessor) CleanNewlines(text string) string
CleanNewlines removes unwanted newlines that break up sentences.
func (*ContentProcessor) Process ¶
func (cp *ContentProcessor) Process(html, url string, opts ProcessOptions) (*ProcessedContent, error)
func (*ContentProcessor) ProcessFromReader ¶
func (cp *ContentProcessor) ProcessFromReader(r io.Reader, url string, opts ProcessOptions) (*ProcessedContent, error)
func (*ContentProcessor) ToMarkdown ¶
func (cp *ContentProcessor) ToMarkdown(content *ProcessedContent, includeMetadata bool, preserveLinks bool) string
func (*ContentProcessor) ToText ¶
func (cp *ContentProcessor) ToText(content *ProcessedContent, lineWidth int) string
type ProcessOptions ¶
Click to show internal directories.
Click to hide internal directories.