Documentation
¶
Index ¶
- Variables
- func RegisterBackendServer(s grpc.ServiceRegistrar, srv BackendServer)
- type BackendClient
- type BackendServer
- type Backend_PredictStreamClient
- type Backend_PredictStreamServer
- type EmbeddingResult
- type GenerateImageRequest
- func (*GenerateImageRequest) Descriptor() ([]byte, []int) deprecated
- func (x *GenerateImageRequest) GetDst() string
- func (x *GenerateImageRequest) GetHeight() int32
- func (x *GenerateImageRequest) GetMode() int32
- func (x *GenerateImageRequest) GetNegativePrompt() string
- func (x *GenerateImageRequest) GetPositivePrompt() string
- func (x *GenerateImageRequest) GetSeed() int32
- func (x *GenerateImageRequest) GetStep() int32
- func (x *GenerateImageRequest) GetWidth() int32
- func (*GenerateImageRequest) ProtoMessage()
- func (x *GenerateImageRequest) ProtoReflect() protoreflect.Message
- func (x *GenerateImageRequest) Reset()
- func (x *GenerateImageRequest) String() string
- type HealthMessage
- type ModelOptions
- func (*ModelOptions) Descriptor() ([]byte, []int) deprecated
- func (x *ModelOptions) GetContextSize() int32
- func (x *ModelOptions) GetEmbeddings() bool
- func (x *ModelOptions) GetF16Memory() bool
- func (x *ModelOptions) GetLibrarySearchPath() string
- func (x *ModelOptions) GetLowVRAM() bool
- func (x *ModelOptions) GetMLock() bool
- func (x *ModelOptions) GetMMap() bool
- func (x *ModelOptions) GetMainGPU() string
- func (x *ModelOptions) GetModel() string
- func (x *ModelOptions) GetNBatch() int32
- func (x *ModelOptions) GetNGPULayers() int32
- func (x *ModelOptions) GetNGQA() int32
- func (x *ModelOptions) GetNUMA() bool
- func (x *ModelOptions) GetRMSNormEps() float32
- func (x *ModelOptions) GetRopeFreqBase() float32
- func (x *ModelOptions) GetRopeFreqScale() float32
- func (x *ModelOptions) GetSeed() int32
- func (x *ModelOptions) GetTensorSplit() string
- func (x *ModelOptions) GetThreads() int32
- func (x *ModelOptions) GetVocabOnly() bool
- func (*ModelOptions) ProtoMessage()
- func (x *ModelOptions) ProtoReflect() protoreflect.Message
- func (x *ModelOptions) Reset()
- func (x *ModelOptions) String() string
- type PredictOptions
- func (*PredictOptions) Descriptor() ([]byte, []int) deprecated
- func (x *PredictOptions) GetBatch() int32
- func (x *PredictOptions) GetDebug() bool
- func (x *PredictOptions) GetDebugMode() bool
- func (x *PredictOptions) GetEmbeddingTokens() []int32
- func (x *PredictOptions) GetEmbeddings() string
- func (x *PredictOptions) GetF16KV() bool
- func (x *PredictOptions) GetFrequencyPenalty() float32
- func (x *PredictOptions) GetGrammar() string
- func (x *PredictOptions) GetIgnoreEOS() bool
- func (x *PredictOptions) GetLogitBias() string
- func (x *PredictOptions) GetMLock() bool
- func (x *PredictOptions) GetMMap() bool
- func (x *PredictOptions) GetMainGPU() string
- func (x *PredictOptions) GetMirostat() int32
- func (x *PredictOptions) GetMirostatETA() float32
- func (x *PredictOptions) GetMirostatTAU() float32
- func (x *PredictOptions) GetNKeep() int32
- func (x *PredictOptions) GetNegativePrompt() string
- func (x *PredictOptions) GetNegativePromptScale() float32
- func (x *PredictOptions) GetPenalizeNL() bool
- func (x *PredictOptions) GetPenalty() float32
- func (x *PredictOptions) GetPresencePenalty() float32
- func (x *PredictOptions) GetPrompt() string
- func (x *PredictOptions) GetPromptCacheAll() bool
- func (x *PredictOptions) GetPromptCachePath() string
- func (x *PredictOptions) GetPromptCacheRO() bool
- func (x *PredictOptions) GetRepeat() int32
- func (x *PredictOptions) GetRopeFreqBase() float32
- func (x *PredictOptions) GetRopeFreqScale() float32
- func (x *PredictOptions) GetSeed() int32
- func (x *PredictOptions) GetStopPrompts() []string
- func (x *PredictOptions) GetTailFreeSamplingZ() float32
- func (x *PredictOptions) GetTemperature() float32
- func (x *PredictOptions) GetTensorSplit() string
- func (x *PredictOptions) GetThreads() int32
- func (x *PredictOptions) GetTokens() int32
- func (x *PredictOptions) GetTopK() int32
- func (x *PredictOptions) GetTopP() float32
- func (x *PredictOptions) GetTypicalP() float32
- func (*PredictOptions) ProtoMessage()
- func (x *PredictOptions) ProtoReflect() protoreflect.Message
- func (x *PredictOptions) Reset()
- func (x *PredictOptions) String() string
- type Reply
- type Result
- type TTSRequest
- func (*TTSRequest) Descriptor() ([]byte, []int) deprecated
- func (x *TTSRequest) GetDst() string
- func (x *TTSRequest) GetModel() string
- func (x *TTSRequest) GetText() string
- func (*TTSRequest) ProtoMessage()
- func (x *TTSRequest) ProtoReflect() protoreflect.Message
- func (x *TTSRequest) Reset()
- func (x *TTSRequest) String() string
- type TranscriptRequest
- func (*TranscriptRequest) Descriptor() ([]byte, []int) deprecated
- func (x *TranscriptRequest) GetDst() string
- func (x *TranscriptRequest) GetLanguage() string
- func (x *TranscriptRequest) GetThreads() uint32
- func (*TranscriptRequest) ProtoMessage()
- func (x *TranscriptRequest) ProtoReflect() protoreflect.Message
- func (x *TranscriptRequest) Reset()
- func (x *TranscriptRequest) String() string
- type TranscriptResult
- func (*TranscriptResult) Descriptor() ([]byte, []int) deprecated
- func (x *TranscriptResult) GetSegments() []*TranscriptSegment
- func (x *TranscriptResult) GetText() string
- func (*TranscriptResult) ProtoMessage()
- func (x *TranscriptResult) ProtoReflect() protoreflect.Message
- func (x *TranscriptResult) Reset()
- func (x *TranscriptResult) String() string
- type TranscriptSegment
- func (*TranscriptSegment) Descriptor() ([]byte, []int) deprecated
- func (x *TranscriptSegment) GetEnd() int64
- func (x *TranscriptSegment) GetId() int32
- func (x *TranscriptSegment) GetStart() int64
- func (x *TranscriptSegment) GetText() string
- func (x *TranscriptSegment) GetTokens() []int32
- func (*TranscriptSegment) ProtoMessage()
- func (x *TranscriptSegment) ProtoReflect() protoreflect.Message
- func (x *TranscriptSegment) Reset()
- func (x *TranscriptSegment) String() string
- type UnimplementedBackendServer
- func (UnimplementedBackendServer) AudioTranscription(context.Context, *TranscriptRequest) (*TranscriptResult, error)
- func (UnimplementedBackendServer) Embedding(context.Context, *PredictOptions) (*EmbeddingResult, error)
- func (UnimplementedBackendServer) GenerateImage(context.Context, *GenerateImageRequest) (*Result, error)
- func (UnimplementedBackendServer) Health(context.Context, *HealthMessage) (*Reply, error)
- func (UnimplementedBackendServer) LoadModel(context.Context, *ModelOptions) (*Result, error)
- func (UnimplementedBackendServer) Predict(context.Context, *PredictOptions) (*Reply, error)
- func (UnimplementedBackendServer) PredictStream(*PredictOptions, Backend_PredictStreamServer) error
- func (UnimplementedBackendServer) TTS(context.Context, *TTSRequest) (*Result, error)
- type UnsafeBackendServer
Constants ¶
This section is empty.
Variables ¶
var Backend_ServiceDesc = grpc.ServiceDesc{ ServiceName: "backend.Backend", HandlerType: (*BackendServer)(nil), Methods: []grpc.MethodDesc{ { MethodName: "Health", Handler: _Backend_Health_Handler, }, { MethodName: "Predict", Handler: _Backend_Predict_Handler, }, { MethodName: "LoadModel", Handler: _Backend_LoadModel_Handler, }, { MethodName: "Embedding", Handler: _Backend_Embedding_Handler, }, { MethodName: "GenerateImage", Handler: _Backend_GenerateImage_Handler, }, { MethodName: "AudioTranscription", Handler: _Backend_AudioTranscription_Handler, }, { MethodName: "TTS", Handler: _Backend_TTS_Handler, }, }, Streams: []grpc.StreamDesc{ { StreamName: "PredictStream", Handler: _Backend_PredictStream_Handler, ServerStreams: true, }, }, Metadata: "pkg/grpc/proto/backend.proto", }
Backend_ServiceDesc is the grpc.ServiceDesc for the Backend service. It is only intended for direct use with grpc.RegisterService, and must not be introspected or modified (even as a copy).
var File_pkg_grpc_proto_backend_proto protoreflect.FileDescriptor
Functions ¶
func RegisterBackendServer ¶
func RegisterBackendServer(s grpc.ServiceRegistrar, srv BackendServer)
Types ¶
type BackendClient ¶
type BackendClient interface {
Health(ctx context.Context, in *HealthMessage, opts ...grpc.CallOption) (*Reply, error)
Predict(ctx context.Context, in *PredictOptions, opts ...grpc.CallOption) (*Reply, error)
LoadModel(ctx context.Context, in *ModelOptions, opts ...grpc.CallOption) (*Result, error)
PredictStream(ctx context.Context, in *PredictOptions, opts ...grpc.CallOption) (Backend_PredictStreamClient, error)
Embedding(ctx context.Context, in *PredictOptions, opts ...grpc.CallOption) (*EmbeddingResult, error)
GenerateImage(ctx context.Context, in *GenerateImageRequest, opts ...grpc.CallOption) (*Result, error)
AudioTranscription(ctx context.Context, in *TranscriptRequest, opts ...grpc.CallOption) (*TranscriptResult, error)
TTS(ctx context.Context, in *TTSRequest, opts ...grpc.CallOption) (*Result, error)
}
BackendClient is the client API for Backend service.
For semantics around ctx use and closing/ending streaming RPCs, please refer to https://pkg.go.dev/google.golang.org/grpc/?tab=doc#ClientConn.NewStream.
func NewBackendClient ¶
func NewBackendClient(cc grpc.ClientConnInterface) BackendClient
type BackendServer ¶
type BackendServer interface {
Health(context.Context, *HealthMessage) (*Reply, error)
Predict(context.Context, *PredictOptions) (*Reply, error)
LoadModel(context.Context, *ModelOptions) (*Result, error)
PredictStream(*PredictOptions, Backend_PredictStreamServer) error
Embedding(context.Context, *PredictOptions) (*EmbeddingResult, error)
GenerateImage(context.Context, *GenerateImageRequest) (*Result, error)
AudioTranscription(context.Context, *TranscriptRequest) (*TranscriptResult, error)
TTS(context.Context, *TTSRequest) (*Result, error)
// contains filtered or unexported methods
}
BackendServer is the server API for the Backend service. All implementations must embed UnimplementedBackendServer for forward compatibility.
type Backend_PredictStreamClient ¶
type Backend_PredictStreamClient interface {
Recv() (*Reply, error)
grpc.ClientStream
}
type Backend_PredictStreamServer ¶
type Backend_PredictStreamServer interface {
Send(*Reply) error
grpc.ServerStream
}
type EmbeddingResult ¶
type EmbeddingResult struct {
Embeddings []float32 `protobuf:"fixed32,1,rep,packed,name=embeddings,proto3" json:"embeddings,omitempty"`
// contains filtered or unexported fields
}
func (*EmbeddingResult) Descriptor
deprecated
func (*EmbeddingResult) Descriptor() ([]byte, []int)
Deprecated: Use EmbeddingResult.ProtoReflect.Descriptor instead.
func (*EmbeddingResult) GetEmbeddings ¶
func (x *EmbeddingResult) GetEmbeddings() []float32
func (*EmbeddingResult) ProtoMessage ¶
func (*EmbeddingResult) ProtoMessage()
func (*EmbeddingResult) ProtoReflect ¶
func (x *EmbeddingResult) ProtoReflect() protoreflect.Message
func (*EmbeddingResult) Reset ¶
func (x *EmbeddingResult) Reset()
func (*EmbeddingResult) String ¶
func (x *EmbeddingResult) String() string
type GenerateImageRequest ¶
type GenerateImageRequest struct {
Height int32 `protobuf:"varint,1,opt,name=height,proto3" json:"height,omitempty"`
Width int32 `protobuf:"varint,2,opt,name=width,proto3" json:"width,omitempty"`
Mode int32 `protobuf:"varint,3,opt,name=mode,proto3" json:"mode,omitempty"`
Step int32 `protobuf:"varint,4,opt,name=step,proto3" json:"step,omitempty"`
Seed int32 `protobuf:"varint,5,opt,name=seed,proto3" json:"seed,omitempty"`
PositivePrompt string `protobuf:"bytes,6,opt,name=positive_prompt,json=positivePrompt,proto3" json:"positive_prompt,omitempty"`
NegativePrompt string `protobuf:"bytes,7,opt,name=negative_prompt,json=negativePrompt,proto3" json:"negative_prompt,omitempty"`
Dst string `protobuf:"bytes,8,opt,name=dst,proto3" json:"dst,omitempty"`
// contains filtered or unexported fields
}
func (*GenerateImageRequest) Descriptor
deprecated
func (*GenerateImageRequest) Descriptor() ([]byte, []int)
Deprecated: Use GenerateImageRequest.ProtoReflect.Descriptor instead.
func (*GenerateImageRequest) GetDst ¶
func (x *GenerateImageRequest) GetDst() string
func (*GenerateImageRequest) GetHeight ¶
func (x *GenerateImageRequest) GetHeight() int32
func (*GenerateImageRequest) GetMode ¶
func (x *GenerateImageRequest) GetMode() int32
func (*GenerateImageRequest) GetNegativePrompt ¶
func (x *GenerateImageRequest) GetNegativePrompt() string
func (*GenerateImageRequest) GetPositivePrompt ¶
func (x *GenerateImageRequest) GetPositivePrompt() string
func (*GenerateImageRequest) GetSeed ¶
func (x *GenerateImageRequest) GetSeed() int32
func (*GenerateImageRequest) GetStep ¶
func (x *GenerateImageRequest) GetStep() int32
func (*GenerateImageRequest) GetWidth ¶
func (x *GenerateImageRequest) GetWidth() int32
func (*GenerateImageRequest) ProtoMessage ¶
func (*GenerateImageRequest) ProtoMessage()
func (*GenerateImageRequest) ProtoReflect ¶
func (x *GenerateImageRequest) ProtoReflect() protoreflect.Message
func (*GenerateImageRequest) Reset ¶
func (x *GenerateImageRequest) Reset()
func (*GenerateImageRequest) String ¶
func (x *GenerateImageRequest) String() string
type HealthMessage ¶
type HealthMessage struct {
// contains filtered or unexported fields
}
func (*HealthMessage) Descriptor
deprecated
func (*HealthMessage) Descriptor() ([]byte, []int)
Deprecated: Use HealthMessage.ProtoReflect.Descriptor instead.
func (*HealthMessage) ProtoMessage ¶
func (*HealthMessage) ProtoMessage()
func (*HealthMessage) ProtoReflect ¶
func (x *HealthMessage) ProtoReflect() protoreflect.Message
func (*HealthMessage) Reset ¶
func (x *HealthMessage) Reset()
func (*HealthMessage) String ¶
func (x *HealthMessage) String() string
type ModelOptions ¶
type ModelOptions struct {
Model string `protobuf:"bytes,1,opt,name=Model,proto3" json:"Model,omitempty"`
ContextSize int32 `protobuf:"varint,2,opt,name=ContextSize,proto3" json:"ContextSize,omitempty"`
Seed int32 `protobuf:"varint,3,opt,name=Seed,proto3" json:"Seed,omitempty"`
NBatch int32 `protobuf:"varint,4,opt,name=NBatch,proto3" json:"NBatch,omitempty"`
F16Memory bool `protobuf:"varint,5,opt,name=F16Memory,proto3" json:"F16Memory,omitempty"`
MLock bool `protobuf:"varint,6,opt,name=MLock,proto3" json:"MLock,omitempty"`
MMap bool `protobuf:"varint,7,opt,name=MMap,proto3" json:"MMap,omitempty"`
VocabOnly bool `protobuf:"varint,8,opt,name=VocabOnly,proto3" json:"VocabOnly,omitempty"`
LowVRAM bool `protobuf:"varint,9,opt,name=LowVRAM,proto3" json:"LowVRAM,omitempty"`
Embeddings bool `protobuf:"varint,10,opt,name=Embeddings,proto3" json:"Embeddings,omitempty"`
NUMA bool `protobuf:"varint,11,opt,name=NUMA,proto3" json:"NUMA,omitempty"`
NGPULayers int32 `protobuf:"varint,12,opt,name=NGPULayers,proto3" json:"NGPULayers,omitempty"`
MainGPU string `protobuf:"bytes,13,opt,name=MainGPU,proto3" json:"MainGPU,omitempty"`
TensorSplit string `protobuf:"bytes,14,opt,name=TensorSplit,proto3" json:"TensorSplit,omitempty"`
Threads int32 `protobuf:"varint,15,opt,name=Threads,proto3" json:"Threads,omitempty"`
LibrarySearchPath string `protobuf:"bytes,16,opt,name=LibrarySearchPath,proto3" json:"LibrarySearchPath,omitempty"`
RopeFreqBase float32 `protobuf:"fixed32,17,opt,name=RopeFreqBase,proto3" json:"RopeFreqBase,omitempty"`
RopeFreqScale float32 `protobuf:"fixed32,18,opt,name=RopeFreqScale,proto3" json:"RopeFreqScale,omitempty"`
RMSNormEps float32 `protobuf:"fixed32,19,opt,name=RMSNormEps,proto3" json:"RMSNormEps,omitempty"`
NGQA int32 `protobuf:"varint,20,opt,name=NGQA,proto3" json:"NGQA,omitempty"`
// contains filtered or unexported fields
}
func (*ModelOptions) Descriptor
deprecated
func (*ModelOptions) Descriptor() ([]byte, []int)
Deprecated: Use ModelOptions.ProtoReflect.Descriptor instead.
func (*ModelOptions) GetContextSize ¶
func (x *ModelOptions) GetContextSize() int32
func (*ModelOptions) GetEmbeddings ¶
func (x *ModelOptions) GetEmbeddings() bool
func (*ModelOptions) GetF16Memory ¶
func (x *ModelOptions) GetF16Memory() bool
func (*ModelOptions) GetLibrarySearchPath ¶
func (x *ModelOptions) GetLibrarySearchPath() string
func (*ModelOptions) GetLowVRAM ¶
func (x *ModelOptions) GetLowVRAM() bool
func (*ModelOptions) GetMLock ¶
func (x *ModelOptions) GetMLock() bool
func (*ModelOptions) GetMMap ¶
func (x *ModelOptions) GetMMap() bool
func (*ModelOptions) GetMainGPU ¶
func (x *ModelOptions) GetMainGPU() string
func (*ModelOptions) GetModel ¶
func (x *ModelOptions) GetModel() string
func (*ModelOptions) GetNBatch ¶
func (x *ModelOptions) GetNBatch() int32
func (*ModelOptions) GetNGPULayers ¶
func (x *ModelOptions) GetNGPULayers() int32
func (*ModelOptions) GetNGQA ¶ added in v1.23.2
func (x *ModelOptions) GetNGQA() int32
func (*ModelOptions) GetNUMA ¶
func (x *ModelOptions) GetNUMA() bool
func (*ModelOptions) GetRMSNormEps ¶ added in v1.23.2
func (x *ModelOptions) GetRMSNormEps() float32
func (*ModelOptions) GetRopeFreqBase ¶ added in v1.23.0
func (x *ModelOptions) GetRopeFreqBase() float32
func (*ModelOptions) GetRopeFreqScale ¶ added in v1.23.0
func (x *ModelOptions) GetRopeFreqScale() float32
func (*ModelOptions) GetSeed ¶
func (x *ModelOptions) GetSeed() int32
func (*ModelOptions) GetTensorSplit ¶
func (x *ModelOptions) GetTensorSplit() string
func (*ModelOptions) GetThreads ¶
func (x *ModelOptions) GetThreads() int32
func (*ModelOptions) GetVocabOnly ¶
func (x *ModelOptions) GetVocabOnly() bool
func (*ModelOptions) ProtoMessage ¶
func (*ModelOptions) ProtoMessage()
func (*ModelOptions) ProtoReflect ¶
func (x *ModelOptions) ProtoReflect() protoreflect.Message
func (*ModelOptions) Reset ¶
func (x *ModelOptions) Reset()
func (*ModelOptions) String ¶
func (x *ModelOptions) String() string
type PredictOptions ¶
type PredictOptions struct {
Prompt string `protobuf:"bytes,1,opt,name=Prompt,proto3" json:"Prompt,omitempty"`
Seed int32 `protobuf:"varint,2,opt,name=Seed,proto3" json:"Seed,omitempty"`
Threads int32 `protobuf:"varint,3,opt,name=Threads,proto3" json:"Threads,omitempty"`
Tokens int32 `protobuf:"varint,4,opt,name=Tokens,proto3" json:"Tokens,omitempty"`
TopK int32 `protobuf:"varint,5,opt,name=TopK,proto3" json:"TopK,omitempty"`
Repeat int32 `protobuf:"varint,6,opt,name=Repeat,proto3" json:"Repeat,omitempty"`
Batch int32 `protobuf:"varint,7,opt,name=Batch,proto3" json:"Batch,omitempty"`
NKeep int32 `protobuf:"varint,8,opt,name=NKeep,proto3" json:"NKeep,omitempty"`
Temperature float32 `protobuf:"fixed32,9,opt,name=Temperature,proto3" json:"Temperature,omitempty"`
Penalty float32 `protobuf:"fixed32,10,opt,name=Penalty,proto3" json:"Penalty,omitempty"`
F16KV bool `protobuf:"varint,11,opt,name=F16KV,proto3" json:"F16KV,omitempty"`
DebugMode bool `protobuf:"varint,12,opt,name=DebugMode,proto3" json:"DebugMode,omitempty"`
StopPrompts []string `protobuf:"bytes,13,rep,name=StopPrompts,proto3" json:"StopPrompts,omitempty"`
IgnoreEOS bool `protobuf:"varint,14,opt,name=IgnoreEOS,proto3" json:"IgnoreEOS,omitempty"`
TailFreeSamplingZ float32 `protobuf:"fixed32,15,opt,name=TailFreeSamplingZ,proto3" json:"TailFreeSamplingZ,omitempty"`
TypicalP float32 `protobuf:"fixed32,16,opt,name=TypicalP,proto3" json:"TypicalP,omitempty"`
FrequencyPenalty float32 `protobuf:"fixed32,17,opt,name=FrequencyPenalty,proto3" json:"FrequencyPenalty,omitempty"`
PresencePenalty float32 `protobuf:"fixed32,18,opt,name=PresencePenalty,proto3" json:"PresencePenalty,omitempty"`
Mirostat int32 `protobuf:"varint,19,opt,name=Mirostat,proto3" json:"Mirostat,omitempty"`
MirostatETA float32 `protobuf:"fixed32,20,opt,name=MirostatETA,proto3" json:"MirostatETA,omitempty"`
MirostatTAU float32 `protobuf:"fixed32,21,opt,name=MirostatTAU,proto3" json:"MirostatTAU,omitempty"`
PenalizeNL bool `protobuf:"varint,22,opt,name=PenalizeNL,proto3" json:"PenalizeNL,omitempty"`
LogitBias string `protobuf:"bytes,23,opt,name=LogitBias,proto3" json:"LogitBias,omitempty"`
MLock bool `protobuf:"varint,25,opt,name=MLock,proto3" json:"MLock,omitempty"`
MMap bool `protobuf:"varint,26,opt,name=MMap,proto3" json:"MMap,omitempty"`
PromptCacheAll bool `protobuf:"varint,27,opt,name=PromptCacheAll,proto3" json:"PromptCacheAll,omitempty"`
PromptCacheRO bool `protobuf:"varint,28,opt,name=PromptCacheRO,proto3" json:"PromptCacheRO,omitempty"`
Grammar string `protobuf:"bytes,29,opt,name=Grammar,proto3" json:"Grammar,omitempty"`
MainGPU string `protobuf:"bytes,30,opt,name=MainGPU,proto3" json:"MainGPU,omitempty"`
TensorSplit string `protobuf:"bytes,31,opt,name=TensorSplit,proto3" json:"TensorSplit,omitempty"`
TopP float32 `protobuf:"fixed32,32,opt,name=TopP,proto3" json:"TopP,omitempty"`
PromptCachePath string `protobuf:"bytes,33,opt,name=PromptCachePath,proto3" json:"PromptCachePath,omitempty"`
Debug bool `protobuf:"varint,34,opt,name=Debug,proto3" json:"Debug,omitempty"`
EmbeddingTokens []int32 `protobuf:"varint,35,rep,packed,name=EmbeddingTokens,proto3" json:"EmbeddingTokens,omitempty"`
Embeddings string `protobuf:"bytes,36,opt,name=Embeddings,proto3" json:"Embeddings,omitempty"`
RopeFreqBase float32 `protobuf:"fixed32,37,opt,name=RopeFreqBase,proto3" json:"RopeFreqBase,omitempty"`
RopeFreqScale float32 `protobuf:"fixed32,38,opt,name=RopeFreqScale,proto3" json:"RopeFreqScale,omitempty"`
NegativePromptScale float32 `protobuf:"fixed32,39,opt,name=NegativePromptScale,proto3" json:"NegativePromptScale,omitempty"`
NegativePrompt string `protobuf:"bytes,40,opt,name=NegativePrompt,proto3" json:"NegativePrompt,omitempty"`
// contains filtered or unexported fields
}
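PredictOptions is the request message for the Predict, PredictStream, and Embedding RPCs. It carries the prompt together with the sampling and runtime options for the request.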
func (*PredictOptions) Descriptor
deprecated
func (*PredictOptions) Descriptor() ([]byte, []int)
Deprecated: Use PredictOptions.ProtoReflect.Descriptor instead.
func (*PredictOptions) GetBatch ¶
func (x *PredictOptions) GetBatch() int32
func (*PredictOptions) GetDebug ¶
func (x *PredictOptions) GetDebug() bool
func (*PredictOptions) GetDebugMode ¶
func (x *PredictOptions) GetDebugMode() bool
func (*PredictOptions) GetEmbeddingTokens ¶
func (x *PredictOptions) GetEmbeddingTokens() []int32
func (*PredictOptions) GetEmbeddings ¶
func (x *PredictOptions) GetEmbeddings() string
func (*PredictOptions) GetF16KV ¶
func (x *PredictOptions) GetF16KV() bool
func (*PredictOptions) GetFrequencyPenalty ¶
func (x *PredictOptions) GetFrequencyPenalty() float32
func (*PredictOptions) GetGrammar ¶
func (x *PredictOptions) GetGrammar() string
func (*PredictOptions) GetIgnoreEOS ¶
func (x *PredictOptions) GetIgnoreEOS() bool
func (*PredictOptions) GetLogitBias ¶
func (x *PredictOptions) GetLogitBias() string
func (*PredictOptions) GetMLock ¶
func (x *PredictOptions) GetMLock() bool
func (*PredictOptions) GetMMap ¶
func (x *PredictOptions) GetMMap() bool
func (*PredictOptions) GetMainGPU ¶
func (x *PredictOptions) GetMainGPU() string
func (*PredictOptions) GetMirostat ¶
func (x *PredictOptions) GetMirostat() int32
func (*PredictOptions) GetMirostatETA ¶
func (x *PredictOptions) GetMirostatETA() float32
func (*PredictOptions) GetMirostatTAU ¶
func (x *PredictOptions) GetMirostatTAU() float32
func (*PredictOptions) GetNKeep ¶
func (x *PredictOptions) GetNKeep() int32
func (*PredictOptions) GetNegativePrompt ¶ added in v1.23.0
func (x *PredictOptions) GetNegativePrompt() string
func (*PredictOptions) GetNegativePromptScale ¶ added in v1.23.0
func (x *PredictOptions) GetNegativePromptScale() float32
func (*PredictOptions) GetPenalizeNL ¶
func (x *PredictOptions) GetPenalizeNL() bool
func (*PredictOptions) GetPenalty ¶
func (x *PredictOptions) GetPenalty() float32
func (*PredictOptions) GetPresencePenalty ¶
func (x *PredictOptions) GetPresencePenalty() float32
func (*PredictOptions) GetPrompt ¶
func (x *PredictOptions) GetPrompt() string
func (*PredictOptions) GetPromptCacheAll ¶
func (x *PredictOptions) GetPromptCacheAll() bool
func (*PredictOptions) GetPromptCachePath ¶
func (x *PredictOptions) GetPromptCachePath() string
func (*PredictOptions) GetPromptCacheRO ¶
func (x *PredictOptions) GetPromptCacheRO() bool
func (*PredictOptions) GetRepeat ¶
func (x *PredictOptions) GetRepeat() int32
func (*PredictOptions) GetRopeFreqBase ¶ added in v1.23.0
func (x *PredictOptions) GetRopeFreqBase() float32
func (*PredictOptions) GetRopeFreqScale ¶ added in v1.23.0
func (x *PredictOptions) GetRopeFreqScale() float32
func (*PredictOptions) GetSeed ¶
func (x *PredictOptions) GetSeed() int32
func (*PredictOptions) GetStopPrompts ¶
func (x *PredictOptions) GetStopPrompts() []string
func (*PredictOptions) GetTailFreeSamplingZ ¶
func (x *PredictOptions) GetTailFreeSamplingZ() float32
func (*PredictOptions) GetTemperature ¶
func (x *PredictOptions) GetTemperature() float32
func (*PredictOptions) GetTensorSplit ¶
func (x *PredictOptions) GetTensorSplit() string
func (*PredictOptions) GetThreads ¶
func (x *PredictOptions) GetThreads() int32
func (*PredictOptions) GetTokens ¶
func (x *PredictOptions) GetTokens() int32
func (*PredictOptions) GetTopK ¶
func (x *PredictOptions) GetTopK() int32
func (*PredictOptions) GetTopP ¶
func (x *PredictOptions) GetTopP() float32
func (*PredictOptions) GetTypicalP ¶
func (x *PredictOptions) GetTypicalP() float32
func (*PredictOptions) ProtoMessage ¶
func (*PredictOptions) ProtoMessage()
func (*PredictOptions) ProtoReflect ¶
func (x *PredictOptions) ProtoReflect() protoreflect.Message
func (*PredictOptions) Reset ¶
func (x *PredictOptions) Reset()
func (*PredictOptions) String ¶
func (x *PredictOptions) String() string
type Reply ¶
type Reply struct {
Message []byte `protobuf:"bytes,1,opt,name=message,proto3" json:"message,omitempty"`
// contains filtered or unexported fields
}
Reply is the response message containing the result, carried as raw bytes in Message.
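func (*Reply) Descriptor
deprecated
func (*Reply) Descriptor() ([]byte, []int)
Deprecated: Use Reply.ProtoReflect.Descriptor instead.
func (*Reply) GetMessage ¶
func (x *Reply) GetMessage() []byte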
func (*Reply) ProtoMessage ¶
func (*Reply) ProtoMessage()
func (*Reply) ProtoReflect ¶
func (x *Reply) ProtoReflect() protoreflect.Message
type Result ¶
type Result struct {
Message string `protobuf:"bytes,1,opt,name=message,proto3" json:"message,omitempty"`
Success bool `protobuf:"varint,2,opt,name=success,proto3" json:"success,omitempty"`
// contains filtered or unexported fields
}
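func (*Result) Descriptor
deprecated
func (*Result) Descriptor() ([]byte, []int)
Deprecated: Use Result.ProtoReflect.Descriptor instead.
func (*Result) GetMessage ¶
func (x *Result) GetMessage() string
func (*Result) GetSuccess ¶
func (x *Result) GetSuccess() bool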
func (*Result) ProtoMessage ¶
func (*Result) ProtoMessage()
func (*Result) ProtoReflect ¶
func (x *Result) ProtoReflect() protoreflect.Message
type TTSRequest ¶
type TTSRequest struct {
Text string `protobuf:"bytes,1,opt,name=text,proto3" json:"text,omitempty"`
Model string `protobuf:"bytes,2,opt,name=model,proto3" json:"model,omitempty"`
Dst string `protobuf:"bytes,3,opt,name=dst,proto3" json:"dst,omitempty"`
// contains filtered or unexported fields
}
func (*TTSRequest) Descriptor
deprecated
func (*TTSRequest) Descriptor() ([]byte, []int)
Deprecated: Use TTSRequest.ProtoReflect.Descriptor instead.
func (*TTSRequest) GetDst ¶
func (x *TTSRequest) GetDst() string
func (*TTSRequest) GetModel ¶
func (x *TTSRequest) GetModel() string
func (*TTSRequest) GetText ¶
func (x *TTSRequest) GetText() string
func (*TTSRequest) ProtoMessage ¶
func (*TTSRequest) ProtoMessage()
func (*TTSRequest) ProtoReflect ¶
func (x *TTSRequest) ProtoReflect() protoreflect.Message
func (*TTSRequest) Reset ¶
func (x *TTSRequest) Reset()
func (*TTSRequest) String ¶
func (x *TTSRequest) String() string
type TranscriptRequest ¶
type TranscriptRequest struct {
Dst string `protobuf:"bytes,2,opt,name=dst,proto3" json:"dst,omitempty"`
Language string `protobuf:"bytes,3,opt,name=language,proto3" json:"language,omitempty"`
Threads uint32 `protobuf:"varint,4,opt,name=threads,proto3" json:"threads,omitempty"`
// contains filtered or unexported fields
}
func (*TranscriptRequest) Descriptor
deprecated
func (*TranscriptRequest) Descriptor() ([]byte, []int)
Deprecated: Use TranscriptRequest.ProtoReflect.Descriptor instead.
func (*TranscriptRequest) GetDst ¶
func (x *TranscriptRequest) GetDst() string
func (*TranscriptRequest) GetLanguage ¶
func (x *TranscriptRequest) GetLanguage() string
func (*TranscriptRequest) GetThreads ¶
func (x *TranscriptRequest) GetThreads() uint32
func (*TranscriptRequest) ProtoMessage ¶
func (*TranscriptRequest) ProtoMessage()
func (*TranscriptRequest) ProtoReflect ¶
func (x *TranscriptRequest) ProtoReflect() protoreflect.Message
func (*TranscriptRequest) Reset ¶
func (x *TranscriptRequest) Reset()
func (*TranscriptRequest) String ¶
func (x *TranscriptRequest) String() string
type TranscriptResult ¶
type TranscriptResult struct {
Segments []*TranscriptSegment `protobuf:"bytes,1,rep,name=segments,proto3" json:"segments,omitempty"`
Text string `protobuf:"bytes,2,opt,name=text,proto3" json:"text,omitempty"`
// contains filtered or unexported fields
}
func (*TranscriptResult) Descriptor
deprecated
func (*TranscriptResult) Descriptor() ([]byte, []int)
Deprecated: Use TranscriptResult.ProtoReflect.Descriptor instead.
func (*TranscriptResult) GetSegments ¶
func (x *TranscriptResult) GetSegments() []*TranscriptSegment
func (*TranscriptResult) GetText ¶
func (x *TranscriptResult) GetText() string
func (*TranscriptResult) ProtoMessage ¶
func (*TranscriptResult) ProtoMessage()
func (*TranscriptResult) ProtoReflect ¶
func (x *TranscriptResult) ProtoReflect() protoreflect.Message
func (*TranscriptResult) Reset ¶
func (x *TranscriptResult) Reset()
func (*TranscriptResult) String ¶
func (x *TranscriptResult) String() string
type TranscriptSegment ¶
type TranscriptSegment struct {
Id int32 `protobuf:"varint,1,opt,name=id,proto3" json:"id,omitempty"`
Start int64 `protobuf:"varint,2,opt,name=start,proto3" json:"start,omitempty"`
End int64 `protobuf:"varint,3,opt,name=end,proto3" json:"end,omitempty"`
Text string `protobuf:"bytes,4,opt,name=text,proto3" json:"text,omitempty"`
Tokens []int32 `protobuf:"varint,5,rep,packed,name=tokens,proto3" json:"tokens,omitempty"`
// contains filtered or unexported fields
}
func (*TranscriptSegment) Descriptor
deprecated
func (*TranscriptSegment) Descriptor() ([]byte, []int)
Deprecated: Use TranscriptSegment.ProtoReflect.Descriptor instead.
func (*TranscriptSegment) GetEnd ¶
func (x *TranscriptSegment) GetEnd() int64
func (*TranscriptSegment) GetId ¶
func (x *TranscriptSegment) GetId() int32
func (*TranscriptSegment) GetStart ¶
func (x *TranscriptSegment) GetStart() int64
func (*TranscriptSegment) GetText ¶
func (x *TranscriptSegment) GetText() string
func (*TranscriptSegment) GetTokens ¶
func (x *TranscriptSegment) GetTokens() []int32
func (*TranscriptSegment) ProtoMessage ¶
func (*TranscriptSegment) ProtoMessage()
func (*TranscriptSegment) ProtoReflect ¶
func (x *TranscriptSegment) ProtoReflect() protoreflect.Message
func (*TranscriptSegment) Reset ¶
func (x *TranscriptSegment) Reset()
func (*TranscriptSegment) String ¶
func (x *TranscriptSegment) String() string
type UnimplementedBackendServer ¶
type UnimplementedBackendServer struct {
}
UnimplementedBackendServer must be embedded to have forward compatible implementations.
func (UnimplementedBackendServer) AudioTranscription ¶
func (UnimplementedBackendServer) AudioTranscription(context.Context, *TranscriptRequest) (*TranscriptResult, error)
func (UnimplementedBackendServer) Embedding ¶
func (UnimplementedBackendServer) Embedding(context.Context, *PredictOptions) (*EmbeddingResult, error)
func (UnimplementedBackendServer) GenerateImage ¶
func (UnimplementedBackendServer) GenerateImage(context.Context, *GenerateImageRequest) (*Result, error)
func (UnimplementedBackendServer) Health ¶
func (UnimplementedBackendServer) Health(context.Context, *HealthMessage) (*Reply, error)
func (UnimplementedBackendServer) LoadModel ¶
func (UnimplementedBackendServer) LoadModel(context.Context, *ModelOptions) (*Result, error)
func (UnimplementedBackendServer) Predict ¶
func (UnimplementedBackendServer) Predict(context.Context, *PredictOptions) (*Reply, error)
func (UnimplementedBackendServer) PredictStream ¶
func (UnimplementedBackendServer) PredictStream(*PredictOptions, Backend_PredictStreamServer) error
func (UnimplementedBackendServer) TTS ¶
func (UnimplementedBackendServer) TTS(context.Context, *TTSRequest) (*Result, error)
type UnsafeBackendServer ¶
type UnsafeBackendServer interface {
// contains filtered or unexported methods
}
UnsafeBackendServer may be embedded to opt out of forward compatibility for this service. Use of this interface is not recommended, as added methods to BackendServer will result in compilation errors.