Documentation
¶
Index ¶
- Constants
- Variables
- func NewWhisperCppLoader(filename string) *whisperCppLoader
- type CSVLoader
- type DirectoryLoader
- type HFImageToText
- type HFSpeechRecognition
- func (h *HFSpeechRecognition) Load(ctx context.Context) ([]document.Document, error)
- func (h *HFSpeechRecognition) WithModel(model string) *HFSpeechRecognition
- func (h *HFSpeechRecognition) WithTextSplitter(textSplitter TextSplitter) *HFSpeechRecognition
- func (h *HFSpeechRecognition) WithToken(token string) *HFSpeechRecognition
- type LibreOfficeLoader
- func (l *LibreOfficeLoader) Load(ctx context.Context) ([]document.Document, error)
- func (l *LibreOfficeLoader) WithArgs(libreOfficeArgs []string) *LibreOfficeLoader
- func (l *LibreOfficeLoader) WithLibreOfficePath(libreOfficePath string) *LibreOfficeLoader
- func (l *LibreOfficeLoader) WithTextSplitter(textSplitter TextSplitter) *LibreOfficeLoader
- type Loader
- type PDFLoader
- type PubMedLoader
- type TesseractLoader
- func (l *TesseractLoader) Load(ctx context.Context) ([]document.Document, error)
- func (l *TesseractLoader) WithArgs(tesseractArgs []string) *TesseractLoader
- func (l *TesseractLoader) WithTesseractPath(tesseractPath string) *TesseractLoader
- func (l *TesseractLoader) WithTextSplitter(textSplitter TextSplitter) *TesseractLoader
- type TextLoader
- type TextSplitter
- type WhisperLoader
Constants ¶
View Source
// SourceMetadataKey is the string "source".
// NOTE(review): presumably the metadata key under which loaders record a
// document's origin — confirm against the loader implementations.
const SourceMetadataKey = "source"
Variables ¶
View Source
var (
	// ErrLibreOfficeNotFound is a sentinel error whose message names
	// LibreOffice. Compare against it with errors.Is rather than by message.
	// NOTE(review): presumably returned when the LibreOffice executable
	// cannot be located — confirm against the LibreOfficeLoader code.
	ErrLibreOfficeNotFound = fmt.Errorf("libreoffice not found")
)
View Source
// ErrPdfToTextNotFound is a sentinel error with the message
// "pdftotext not found".
// NOTE(review): presumably returned when the pdftotext executable cannot be
// located — confirm against the PDFLoader code.
var ErrPdfToTextNotFound = fmt.Errorf("pdftotext not found")
View Source
var (
	// ErrTesseractNotFound is a sentinel error whose message names
	// Tesseract. Compare against it with errors.Is rather than by message.
	// NOTE(review): presumably returned when the tesseract executable cannot
	// be located — confirm against the TesseractLoader code.
	ErrTesseractNotFound = fmt.Errorf("tesseract not found")
)
View Source
// ErrorInternal is a sentinel error with the message "internal error".
// NOTE(review): the name departs from the ErrXxx convention used by the other
// sentinel errors in this package; it is kept as-is because renaming an
// exported identifier would break callers.
var ErrorInternal = fmt.Errorf("internal error")
Functions ¶
func NewWhisperCppLoader ¶ added in v0.0.6
func NewWhisperCppLoader(filename string) *whisperCppLoader
Types ¶
type CSVLoader ¶ added in v0.0.9
type CSVLoader struct {
// contains filtered or unexported fields
}
func NewCSVLoader ¶ added in v0.0.6
func (*CSVLoader) WithLazyQuotes ¶ added in v0.0.9
func (*CSVLoader) WithSeparator ¶ added in v0.0.9
func (*CSVLoader) WithTextSplitter ¶ added in v0.0.9
func (t *CSVLoader) WithTextSplitter(textSplitter TextSplitter) *CSVLoader
type DirectoryLoader ¶
type DirectoryLoader struct {
// contains filtered or unexported fields
}
func NewDirectoryLoader ¶
func NewDirectoryLoader(dirname string, regExPathMatch string) *DirectoryLoader
func (*DirectoryLoader) WithTextSplitter ¶ added in v0.0.9
func (d *DirectoryLoader) WithTextSplitter(textSplitter TextSplitter) *DirectoryLoader
type HFImageToText ¶ added in v0.0.9
type HFImageToText struct {
// contains filtered or unexported fields
}
func NewHFImageToTextLoader ¶ added in v0.0.7
func NewHFImageToTextLoader(mediaFile string) *HFImageToText
func (*HFImageToText) WithModel ¶ added in v0.0.9
func (h *HFImageToText) WithModel(model string) *HFImageToText
func (*HFImageToText) WithTextSplitter ¶ added in v0.0.9
func (h *HFImageToText) WithTextSplitter(textSplitter TextSplitter) *HFImageToText
func (*HFImageToText) WithToken ¶ added in v0.0.9
func (h *HFImageToText) WithToken(token string) *HFImageToText
type HFSpeechRecognition ¶ added in v0.0.9
type HFSpeechRecognition struct {
// contains filtered or unexported fields
}
func NewHFSpeechRecognitionLoader ¶ added in v0.0.7
func NewHFSpeechRecognitionLoader(mediaFile string) *HFSpeechRecognition
func (*HFSpeechRecognition) WithModel ¶ added in v0.0.9
func (h *HFSpeechRecognition) WithModel(model string) *HFSpeechRecognition
func (*HFSpeechRecognition) WithTextSplitter ¶ added in v0.0.9
func (h *HFSpeechRecognition) WithTextSplitter(textSplitter TextSplitter) *HFSpeechRecognition
func (*HFSpeechRecognition) WithToken ¶ added in v0.0.9
func (h *HFSpeechRecognition) WithToken(token string) *HFSpeechRecognition
type LibreOfficeLoader ¶ added in v0.0.9
type LibreOfficeLoader struct {
// contains filtered or unexported fields
}
func NewLibreOfficeLoader ¶ added in v0.0.6
func NewLibreOfficeLoader(filename string) *LibreOfficeLoader
func (*LibreOfficeLoader) WithArgs ¶ added in v0.0.9
func (l *LibreOfficeLoader) WithArgs(libreOfficeArgs []string) *LibreOfficeLoader
func (*LibreOfficeLoader) WithLibreOfficePath ¶ added in v0.0.9
func (l *LibreOfficeLoader) WithLibreOfficePath(libreOfficePath string) *LibreOfficeLoader
func (*LibreOfficeLoader) WithTextSplitter ¶ added in v0.0.9
func (l *LibreOfficeLoader) WithTextSplitter(textSplitter TextSplitter) *LibreOfficeLoader
type PDFLoader ¶ added in v0.0.9
type PDFLoader struct {
// contains filtered or unexported fields
}
func NewPDFToTextLoader ¶ added in v0.0.4
func (*PDFLoader) WithPDFToTextPath ¶ added in v0.0.9
func (*PDFLoader) WithTextSplitter ¶ added in v0.0.9
func (p *PDFLoader) WithTextSplitter(textSplitter TextSplitter) *PDFLoader
type PubMedLoader ¶ added in v0.0.9
type PubMedLoader struct {
// contains filtered or unexported fields
}
func NewPubmedLoader ¶ added in v0.0.4
func NewPubmedLoader(pubMedIDs []string) *PubMedLoader
func (*PubMedLoader) WithTextSplitter ¶ added in v0.0.9
func (p *PubMedLoader) WithTextSplitter(textSplitter TextSplitter) *PubMedLoader
type TesseractLoader ¶ added in v0.0.9
type TesseractLoader struct {
// contains filtered or unexported fields
}
func NewTesseractLoader ¶ added in v0.0.7
func NewTesseractLoader(filename string) *TesseractLoader
func (*TesseractLoader) WithArgs ¶ added in v0.0.9
func (l *TesseractLoader) WithArgs(tesseractArgs []string) *TesseractLoader
func (*TesseractLoader) WithTesseractPath ¶ added in v0.0.9
func (l *TesseractLoader) WithTesseractPath(tesseractPath string) *TesseractLoader
func (*TesseractLoader) WithTextSplitter ¶ added in v0.0.9
func (l *TesseractLoader) WithTextSplitter(textSplitter TextSplitter) *TesseractLoader
type TextLoader ¶
type TextLoader struct {
// contains filtered or unexported fields
}
func NewTextLoader ¶
func NewTextLoader(filename string, metadata types.Meta) *TextLoader
func (*TextLoader) WithTextSplitter ¶ added in v0.0.9
func (t *TextLoader) WithTextSplitter(textSplitter TextSplitter) *TextLoader
type TextSplitter ¶ added in v0.0.5
type WhisperLoader ¶ added in v0.0.9
type WhisperLoader struct {
// contains filtered or unexported fields
}
func NewWhisperLoader ¶ added in v0.0.6
func NewWhisperLoader(filename string) *WhisperLoader
func (*WhisperLoader) WithClient ¶ added in v0.0.9
func (w *WhisperLoader) WithClient(client *openai.Client) *WhisperLoader
Click to show internal directories.
Click to hide internal directories.