proto

package
v1.25.0 Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Aug 26, 2023 License: MIT Imports: 8 Imported by: 1

Documentation

Index

Constants

This section is empty.

Variables

View Source
var (
	StatusResponse_State_name = map[int32]string{
		0:  "UNINITIALIZED",
		1:  "BUSY",
		2:  "READY",
		-1: "ERROR",
	}
	StatusResponse_State_value = map[string]int32{
		"UNINITIALIZED": 0,
		"BUSY":          1,
		"READY":         2,
		"ERROR":         -1,
	}
)

Enum value maps for StatusResponse_State.

View Source
var Backend_ServiceDesc = grpc.ServiceDesc{
	ServiceName: "backend.Backend",
	HandlerType: (*BackendServer)(nil),
	Methods: []grpc.MethodDesc{
		{
			MethodName: "Health",
			Handler:    _Backend_Health_Handler,
		},
		{
			MethodName: "Predict",
			Handler:    _Backend_Predict_Handler,
		},
		{
			MethodName: "LoadModel",
			Handler:    _Backend_LoadModel_Handler,
		},
		{
			MethodName: "Embedding",
			Handler:    _Backend_Embedding_Handler,
		},
		{
			MethodName: "GenerateImage",
			Handler:    _Backend_GenerateImage_Handler,
		},
		{
			MethodName: "AudioTranscription",
			Handler:    _Backend_AudioTranscription_Handler,
		},
		{
			MethodName: "TTS",
			Handler:    _Backend_TTS_Handler,
		},
		{
			MethodName: "TokenizeString",
			Handler:    _Backend_TokenizeString_Handler,
		},
		{
			MethodName: "Status",
			Handler:    _Backend_Status_Handler,
		},
	},
	Streams: []grpc.StreamDesc{
		{
			StreamName:    "PredictStream",
			Handler:       _Backend_PredictStream_Handler,
			ServerStreams: true,
		},
	},
	Metadata: "pkg/grpc/proto/backend.proto",
}

Backend_ServiceDesc is the grpc.ServiceDesc for Backend service. It's only intended for direct use with grpc.RegisterService, and not to be introspected or modified (even as a copy).

View Source
var File_pkg_grpc_proto_backend_proto protoreflect.FileDescriptor

Functions

func RegisterBackendServer

func RegisterBackendServer(s grpc.ServiceRegistrar, srv BackendServer)

Types

type BackendClient

type BackendClient interface {
	Health(ctx context.Context, in *HealthMessage, opts ...grpc.CallOption) (*Reply, error)
	Predict(ctx context.Context, in *PredictOptions, opts ...grpc.CallOption) (*Reply, error)
	LoadModel(ctx context.Context, in *ModelOptions, opts ...grpc.CallOption) (*Result, error)
	PredictStream(ctx context.Context, in *PredictOptions, opts ...grpc.CallOption) (Backend_PredictStreamClient, error)
	Embedding(ctx context.Context, in *PredictOptions, opts ...grpc.CallOption) (*EmbeddingResult, error)
	GenerateImage(ctx context.Context, in *GenerateImageRequest, opts ...grpc.CallOption) (*Result, error)
	AudioTranscription(ctx context.Context, in *TranscriptRequest, opts ...grpc.CallOption) (*TranscriptResult, error)
	TTS(ctx context.Context, in *TTSRequest, opts ...grpc.CallOption) (*Result, error)
	TokenizeString(ctx context.Context, in *PredictOptions, opts ...grpc.CallOption) (*TokenizationResponse, error)
	Status(ctx context.Context, in *HealthMessage, opts ...grpc.CallOption) (*StatusResponse, error)
}

BackendClient is the client API for Backend service.

For semantics around ctx use and closing/ending streaming RPCs, please refer to https://pkg.go.dev/google.golang.org/grpc/?tab=doc#ClientConn.NewStream.

func NewBackendClient

func NewBackendClient(cc grpc.ClientConnInterface) BackendClient

type BackendServer

type BackendServer interface {
	Health(context.Context, *HealthMessage) (*Reply, error)
	Predict(context.Context, *PredictOptions) (*Reply, error)
	LoadModel(context.Context, *ModelOptions) (*Result, error)
	PredictStream(*PredictOptions, Backend_PredictStreamServer) error
	Embedding(context.Context, *PredictOptions) (*EmbeddingResult, error)
	GenerateImage(context.Context, *GenerateImageRequest) (*Result, error)
	AudioTranscription(context.Context, *TranscriptRequest) (*TranscriptResult, error)
	TTS(context.Context, *TTSRequest) (*Result, error)
	TokenizeString(context.Context, *PredictOptions) (*TokenizationResponse, error)
	Status(context.Context, *HealthMessage) (*StatusResponse, error)
	// contains filtered or unexported methods
}

BackendServer is the server API for Backend service. All implementations must embed UnimplementedBackendServer for forward compatibility.

type Backend_PredictStreamClient

type Backend_PredictStreamClient interface {
	Recv() (*Reply, error)
	grpc.ClientStream
}

type Backend_PredictStreamServer

type Backend_PredictStreamServer interface {
	Send(*Reply) error
	grpc.ServerStream
}

type EmbeddingResult

type EmbeddingResult struct {
	Embeddings []float32 `protobuf:"fixed32,1,rep,packed,name=embeddings,proto3" json:"embeddings,omitempty"`
	// contains filtered or unexported fields
}

func (*EmbeddingResult) Descriptor deprecated

func (*EmbeddingResult) Descriptor() ([]byte, []int)

Deprecated: Use EmbeddingResult.ProtoReflect.Descriptor instead.

func (*EmbeddingResult) GetEmbeddings

func (x *EmbeddingResult) GetEmbeddings() []float32

func (*EmbeddingResult) ProtoMessage

func (*EmbeddingResult) ProtoMessage()

func (*EmbeddingResult) ProtoReflect

func (x *EmbeddingResult) ProtoReflect() protoreflect.Message

func (*EmbeddingResult) Reset

func (x *EmbeddingResult) Reset()

func (*EmbeddingResult) String

func (x *EmbeddingResult) String() string

type GenerateImageRequest

type GenerateImageRequest struct {
	Height         int32  `protobuf:"varint,1,opt,name=height,proto3" json:"height,omitempty"`
	Width          int32  `protobuf:"varint,2,opt,name=width,proto3" json:"width,omitempty"`
	Mode           int32  `protobuf:"varint,3,opt,name=mode,proto3" json:"mode,omitempty"`
	Step           int32  `protobuf:"varint,4,opt,name=step,proto3" json:"step,omitempty"`
	Seed           int32  `protobuf:"varint,5,opt,name=seed,proto3" json:"seed,omitempty"`
	PositivePrompt string `protobuf:"bytes,6,opt,name=positive_prompt,json=positivePrompt,proto3" json:"positive_prompt,omitempty"`
	NegativePrompt string `protobuf:"bytes,7,opt,name=negative_prompt,json=negativePrompt,proto3" json:"negative_prompt,omitempty"`
	Dst            string `protobuf:"bytes,8,opt,name=dst,proto3" json:"dst,omitempty"`
	Src            string `protobuf:"bytes,9,opt,name=src,proto3" json:"src,omitempty"`
	// Diffusers
	EnableParameters string `protobuf:"bytes,10,opt,name=EnableParameters,proto3" json:"EnableParameters,omitempty"`
	CLIPSkip         int32  `protobuf:"varint,11,opt,name=CLIPSkip,proto3" json:"CLIPSkip,omitempty"`
	// contains filtered or unexported fields
}

func (*GenerateImageRequest) Descriptor deprecated

func (*GenerateImageRequest) Descriptor() ([]byte, []int)

Deprecated: Use GenerateImageRequest.ProtoReflect.Descriptor instead.

func (*GenerateImageRequest) GetCLIPSkip added in v1.25.0

func (x *GenerateImageRequest) GetCLIPSkip() int32

func (*GenerateImageRequest) GetDst

func (x *GenerateImageRequest) GetDst() string

func (*GenerateImageRequest) GetEnableParameters added in v1.25.0

func (x *GenerateImageRequest) GetEnableParameters() string

func (*GenerateImageRequest) GetHeight

func (x *GenerateImageRequest) GetHeight() int32

func (*GenerateImageRequest) GetMode

func (x *GenerateImageRequest) GetMode() int32

func (*GenerateImageRequest) GetNegativePrompt

func (x *GenerateImageRequest) GetNegativePrompt() string

func (*GenerateImageRequest) GetPositivePrompt

func (x *GenerateImageRequest) GetPositivePrompt() string

func (*GenerateImageRequest) GetSeed

func (x *GenerateImageRequest) GetSeed() int32

func (*GenerateImageRequest) GetSrc added in v1.25.0

func (x *GenerateImageRequest) GetSrc() string

func (*GenerateImageRequest) GetStep

func (x *GenerateImageRequest) GetStep() int32

func (*GenerateImageRequest) GetWidth

func (x *GenerateImageRequest) GetWidth() int32

func (*GenerateImageRequest) ProtoMessage

func (*GenerateImageRequest) ProtoMessage()

func (*GenerateImageRequest) ProtoReflect

func (x *GenerateImageRequest) ProtoReflect() protoreflect.Message

func (*GenerateImageRequest) Reset

func (x *GenerateImageRequest) Reset()

func (*GenerateImageRequest) String

func (x *GenerateImageRequest) String() string

type HealthMessage

type HealthMessage struct {
	// contains filtered or unexported fields
}

func (*HealthMessage) Descriptor deprecated

func (*HealthMessage) Descriptor() ([]byte, []int)

Deprecated: Use HealthMessage.ProtoReflect.Descriptor instead.

func (*HealthMessage) ProtoMessage

func (*HealthMessage) ProtoMessage()

func (*HealthMessage) ProtoReflect

func (x *HealthMessage) ProtoReflect() protoreflect.Message

func (*HealthMessage) Reset

func (x *HealthMessage) Reset()

func (*HealthMessage) String

func (x *HealthMessage) String() string

type MemoryUsageData added in v1.25.0

type MemoryUsageData struct {
	Total     uint64            `protobuf:"varint,1,opt,name=total,proto3" json:"total,omitempty"`
	Breakdown map[string]uint64 `` /* 160-byte string literal not displayed */
	// contains filtered or unexported fields
}

func (*MemoryUsageData) Descriptor deprecated added in v1.25.0

func (*MemoryUsageData) Descriptor() ([]byte, []int)

Deprecated: Use MemoryUsageData.ProtoReflect.Descriptor instead.

func (*MemoryUsageData) GetBreakdown added in v1.25.0

func (x *MemoryUsageData) GetBreakdown() map[string]uint64

func (*MemoryUsageData) GetTotal added in v1.25.0

func (x *MemoryUsageData) GetTotal() uint64

func (*MemoryUsageData) ProtoMessage added in v1.25.0

func (*MemoryUsageData) ProtoMessage()

func (*MemoryUsageData) ProtoReflect added in v1.25.0

func (x *MemoryUsageData) ProtoReflect() protoreflect.Message

func (*MemoryUsageData) Reset added in v1.25.0

func (x *MemoryUsageData) Reset()

func (*MemoryUsageData) String added in v1.25.0

func (x *MemoryUsageData) String() string

type ModelOptions

type ModelOptions struct {
	Model             string  `protobuf:"bytes,1,opt,name=Model,proto3" json:"Model,omitempty"`
	ContextSize       int32   `protobuf:"varint,2,opt,name=ContextSize,proto3" json:"ContextSize,omitempty"`
	Seed              int32   `protobuf:"varint,3,opt,name=Seed,proto3" json:"Seed,omitempty"`
	NBatch            int32   `protobuf:"varint,4,opt,name=NBatch,proto3" json:"NBatch,omitempty"`
	F16Memory         bool    `protobuf:"varint,5,opt,name=F16Memory,proto3" json:"F16Memory,omitempty"`
	MLock             bool    `protobuf:"varint,6,opt,name=MLock,proto3" json:"MLock,omitempty"`
	MMap              bool    `protobuf:"varint,7,opt,name=MMap,proto3" json:"MMap,omitempty"`
	VocabOnly         bool    `protobuf:"varint,8,opt,name=VocabOnly,proto3" json:"VocabOnly,omitempty"`
	LowVRAM           bool    `protobuf:"varint,9,opt,name=LowVRAM,proto3" json:"LowVRAM,omitempty"`
	Embeddings        bool    `protobuf:"varint,10,opt,name=Embeddings,proto3" json:"Embeddings,omitempty"`
	NUMA              bool    `protobuf:"varint,11,opt,name=NUMA,proto3" json:"NUMA,omitempty"`
	NGPULayers        int32   `protobuf:"varint,12,opt,name=NGPULayers,proto3" json:"NGPULayers,omitempty"`
	MainGPU           string  `protobuf:"bytes,13,opt,name=MainGPU,proto3" json:"MainGPU,omitempty"`
	TensorSplit       string  `protobuf:"bytes,14,opt,name=TensorSplit,proto3" json:"TensorSplit,omitempty"`
	Threads           int32   `protobuf:"varint,15,opt,name=Threads,proto3" json:"Threads,omitempty"`
	LibrarySearchPath string  `protobuf:"bytes,16,opt,name=LibrarySearchPath,proto3" json:"LibrarySearchPath,omitempty"`
	RopeFreqBase      float32 `protobuf:"fixed32,17,opt,name=RopeFreqBase,proto3" json:"RopeFreqBase,omitempty"`
	RopeFreqScale     float32 `protobuf:"fixed32,18,opt,name=RopeFreqScale,proto3" json:"RopeFreqScale,omitempty"`
	RMSNormEps        float32 `protobuf:"fixed32,19,opt,name=RMSNormEps,proto3" json:"RMSNormEps,omitempty"`
	NGQA              int32   `protobuf:"varint,20,opt,name=NGQA,proto3" json:"NGQA,omitempty"`
	ModelFile         string  `protobuf:"bytes,21,opt,name=ModelFile,proto3" json:"ModelFile,omitempty"`
	// AutoGPTQ
	Device           string `protobuf:"bytes,22,opt,name=Device,proto3" json:"Device,omitempty"`
	UseTriton        bool   `protobuf:"varint,23,opt,name=UseTriton,proto3" json:"UseTriton,omitempty"`
	ModelBaseName    string `protobuf:"bytes,24,opt,name=ModelBaseName,proto3" json:"ModelBaseName,omitempty"`
	UseFastTokenizer bool   `protobuf:"varint,25,opt,name=UseFastTokenizer,proto3" json:"UseFastTokenizer,omitempty"`
	// Diffusers
	PipelineType  string  `protobuf:"bytes,26,opt,name=PipelineType,proto3" json:"PipelineType,omitempty"`
	SchedulerType string  `protobuf:"bytes,27,opt,name=SchedulerType,proto3" json:"SchedulerType,omitempty"`
	CUDA          bool    `protobuf:"varint,28,opt,name=CUDA,proto3" json:"CUDA,omitempty"`
	CFGScale      float32 `protobuf:"fixed32,29,opt,name=CFGScale,proto3" json:"CFGScale,omitempty"`
	IMG2IMG       bool    `protobuf:"varint,30,opt,name=IMG2IMG,proto3" json:"IMG2IMG,omitempty"`
	CLIPModel     string  `protobuf:"bytes,31,opt,name=CLIPModel,proto3" json:"CLIPModel,omitempty"`
	CLIPSubfolder string  `protobuf:"bytes,32,opt,name=CLIPSubfolder,proto3" json:"CLIPSubfolder,omitempty"`
	CLIPSkip      int32   `protobuf:"varint,33,opt,name=CLIPSkip,proto3" json:"CLIPSkip,omitempty"`
	// RWKV
	Tokenizer string `protobuf:"bytes,34,opt,name=Tokenizer,proto3" json:"Tokenizer,omitempty"`
	// LLM (llama.cpp)
	LoraBase    string `protobuf:"bytes,35,opt,name=LoraBase,proto3" json:"LoraBase,omitempty"`
	LoraAdapter string `protobuf:"bytes,36,opt,name=LoraAdapter,proto3" json:"LoraAdapter,omitempty"`
	NoMulMatQ   bool   `protobuf:"varint,37,opt,name=NoMulMatQ,proto3" json:"NoMulMatQ,omitempty"`
	// contains filtered or unexported fields
}

func (*ModelOptions) Descriptor deprecated

func (*ModelOptions) Descriptor() ([]byte, []int)

Deprecated: Use ModelOptions.ProtoReflect.Descriptor instead.

func (*ModelOptions) GetCFGScale added in v1.25.0

func (x *ModelOptions) GetCFGScale() float32

func (*ModelOptions) GetCLIPModel added in v1.25.0

func (x *ModelOptions) GetCLIPModel() string

func (*ModelOptions) GetCLIPSkip added in v1.25.0

func (x *ModelOptions) GetCLIPSkip() int32

func (*ModelOptions) GetCLIPSubfolder added in v1.25.0

func (x *ModelOptions) GetCLIPSubfolder() string

func (*ModelOptions) GetCUDA added in v1.24.1

func (x *ModelOptions) GetCUDA() bool

func (*ModelOptions) GetContextSize

func (x *ModelOptions) GetContextSize() int32

func (*ModelOptions) GetDevice added in v1.24.1

func (x *ModelOptions) GetDevice() string

func (*ModelOptions) GetEmbeddings

func (x *ModelOptions) GetEmbeddings() bool

func (*ModelOptions) GetF16Memory

func (x *ModelOptions) GetF16Memory() bool

func (*ModelOptions) GetIMG2IMG added in v1.25.0

func (x *ModelOptions) GetIMG2IMG() bool

func (*ModelOptions) GetLibrarySearchPath

func (x *ModelOptions) GetLibrarySearchPath() string

func (*ModelOptions) GetLoraAdapter added in v1.25.0

func (x *ModelOptions) GetLoraAdapter() string

func (*ModelOptions) GetLoraBase added in v1.25.0

func (x *ModelOptions) GetLoraBase() string

func (*ModelOptions) GetLowVRAM

func (x *ModelOptions) GetLowVRAM() bool

func (*ModelOptions) GetMLock

func (x *ModelOptions) GetMLock() bool

func (*ModelOptions) GetMMap

func (x *ModelOptions) GetMMap() bool

func (*ModelOptions) GetMainGPU

func (x *ModelOptions) GetMainGPU() string

func (*ModelOptions) GetModel

func (x *ModelOptions) GetModel() string

func (*ModelOptions) GetModelBaseName added in v1.24.1

func (x *ModelOptions) GetModelBaseName() string

func (*ModelOptions) GetModelFile added in v1.24.1

func (x *ModelOptions) GetModelFile() string

func (*ModelOptions) GetNBatch

func (x *ModelOptions) GetNBatch() int32

func (*ModelOptions) GetNGPULayers

func (x *ModelOptions) GetNGPULayers() int32

func (*ModelOptions) GetNGQA added in v1.23.2

func (x *ModelOptions) GetNGQA() int32

func (*ModelOptions) GetNUMA

func (x *ModelOptions) GetNUMA() bool

func (*ModelOptions) GetNoMulMatQ added in v1.25.0

func (x *ModelOptions) GetNoMulMatQ() bool

func (*ModelOptions) GetPipelineType added in v1.24.1

func (x *ModelOptions) GetPipelineType() string

func (*ModelOptions) GetRMSNormEps added in v1.23.2

func (x *ModelOptions) GetRMSNormEps() float32

func (*ModelOptions) GetRopeFreqBase added in v1.23.0

func (x *ModelOptions) GetRopeFreqBase() float32

func (*ModelOptions) GetRopeFreqScale added in v1.23.0

func (x *ModelOptions) GetRopeFreqScale() float32

func (*ModelOptions) GetSchedulerType added in v1.24.1

func (x *ModelOptions) GetSchedulerType() string

func (*ModelOptions) GetSeed

func (x *ModelOptions) GetSeed() int32

func (*ModelOptions) GetTensorSplit

func (x *ModelOptions) GetTensorSplit() string

func (*ModelOptions) GetThreads

func (x *ModelOptions) GetThreads() int32

func (*ModelOptions) GetTokenizer added in v1.25.0

func (x *ModelOptions) GetTokenizer() string

func (*ModelOptions) GetUseFastTokenizer added in v1.24.1

func (x *ModelOptions) GetUseFastTokenizer() bool

func (*ModelOptions) GetUseTriton added in v1.24.1

func (x *ModelOptions) GetUseTriton() bool

func (*ModelOptions) GetVocabOnly

func (x *ModelOptions) GetVocabOnly() bool

func (*ModelOptions) ProtoMessage

func (*ModelOptions) ProtoMessage()

func (*ModelOptions) ProtoReflect

func (x *ModelOptions) ProtoReflect() protoreflect.Message

func (*ModelOptions) Reset

func (x *ModelOptions) Reset()

func (*ModelOptions) String

func (x *ModelOptions) String() string

type PredictOptions

type PredictOptions struct {
	Prompt              string   `protobuf:"bytes,1,opt,name=Prompt,proto3" json:"Prompt,omitempty"`
	Seed                int32    `protobuf:"varint,2,opt,name=Seed,proto3" json:"Seed,omitempty"`
	Threads             int32    `protobuf:"varint,3,opt,name=Threads,proto3" json:"Threads,omitempty"`
	Tokens              int32    `protobuf:"varint,4,opt,name=Tokens,proto3" json:"Tokens,omitempty"`
	TopK                int32    `protobuf:"varint,5,opt,name=TopK,proto3" json:"TopK,omitempty"`
	Repeat              int32    `protobuf:"varint,6,opt,name=Repeat,proto3" json:"Repeat,omitempty"`
	Batch               int32    `protobuf:"varint,7,opt,name=Batch,proto3" json:"Batch,omitempty"`
	NKeep               int32    `protobuf:"varint,8,opt,name=NKeep,proto3" json:"NKeep,omitempty"`
	Temperature         float32  `protobuf:"fixed32,9,opt,name=Temperature,proto3" json:"Temperature,omitempty"`
	Penalty             float32  `protobuf:"fixed32,10,opt,name=Penalty,proto3" json:"Penalty,omitempty"`
	F16KV               bool     `protobuf:"varint,11,opt,name=F16KV,proto3" json:"F16KV,omitempty"`
	DebugMode           bool     `protobuf:"varint,12,opt,name=DebugMode,proto3" json:"DebugMode,omitempty"`
	StopPrompts         []string `protobuf:"bytes,13,rep,name=StopPrompts,proto3" json:"StopPrompts,omitempty"`
	IgnoreEOS           bool     `protobuf:"varint,14,opt,name=IgnoreEOS,proto3" json:"IgnoreEOS,omitempty"`
	TailFreeSamplingZ   float32  `protobuf:"fixed32,15,opt,name=TailFreeSamplingZ,proto3" json:"TailFreeSamplingZ,omitempty"`
	TypicalP            float32  `protobuf:"fixed32,16,opt,name=TypicalP,proto3" json:"TypicalP,omitempty"`
	FrequencyPenalty    float32  `protobuf:"fixed32,17,opt,name=FrequencyPenalty,proto3" json:"FrequencyPenalty,omitempty"`
	PresencePenalty     float32  `protobuf:"fixed32,18,opt,name=PresencePenalty,proto3" json:"PresencePenalty,omitempty"`
	Mirostat            int32    `protobuf:"varint,19,opt,name=Mirostat,proto3" json:"Mirostat,omitempty"`
	MirostatETA         float32  `protobuf:"fixed32,20,opt,name=MirostatETA,proto3" json:"MirostatETA,omitempty"`
	MirostatTAU         float32  `protobuf:"fixed32,21,opt,name=MirostatTAU,proto3" json:"MirostatTAU,omitempty"`
	PenalizeNL          bool     `protobuf:"varint,22,opt,name=PenalizeNL,proto3" json:"PenalizeNL,omitempty"`
	LogitBias           string   `protobuf:"bytes,23,opt,name=LogitBias,proto3" json:"LogitBias,omitempty"`
	MLock               bool     `protobuf:"varint,25,opt,name=MLock,proto3" json:"MLock,omitempty"`
	MMap                bool     `protobuf:"varint,26,opt,name=MMap,proto3" json:"MMap,omitempty"`
	PromptCacheAll      bool     `protobuf:"varint,27,opt,name=PromptCacheAll,proto3" json:"PromptCacheAll,omitempty"`
	PromptCacheRO       bool     `protobuf:"varint,28,opt,name=PromptCacheRO,proto3" json:"PromptCacheRO,omitempty"`
	Grammar             string   `protobuf:"bytes,29,opt,name=Grammar,proto3" json:"Grammar,omitempty"`
	MainGPU             string   `protobuf:"bytes,30,opt,name=MainGPU,proto3" json:"MainGPU,omitempty"`
	TensorSplit         string   `protobuf:"bytes,31,opt,name=TensorSplit,proto3" json:"TensorSplit,omitempty"`
	TopP                float32  `protobuf:"fixed32,32,opt,name=TopP,proto3" json:"TopP,omitempty"`
	PromptCachePath     string   `protobuf:"bytes,33,opt,name=PromptCachePath,proto3" json:"PromptCachePath,omitempty"`
	Debug               bool     `protobuf:"varint,34,opt,name=Debug,proto3" json:"Debug,omitempty"`
	EmbeddingTokens     []int32  `protobuf:"varint,35,rep,packed,name=EmbeddingTokens,proto3" json:"EmbeddingTokens,omitempty"`
	Embeddings          string   `protobuf:"bytes,36,opt,name=Embeddings,proto3" json:"Embeddings,omitempty"`
	RopeFreqBase        float32  `protobuf:"fixed32,37,opt,name=RopeFreqBase,proto3" json:"RopeFreqBase,omitempty"`
	RopeFreqScale       float32  `protobuf:"fixed32,38,opt,name=RopeFreqScale,proto3" json:"RopeFreqScale,omitempty"`
	NegativePromptScale float32  `protobuf:"fixed32,39,opt,name=NegativePromptScale,proto3" json:"NegativePromptScale,omitempty"`
	NegativePrompt      string   `protobuf:"bytes,40,opt,name=NegativePrompt,proto3" json:"NegativePrompt,omitempty"`
	// contains filtered or unexported fields
}

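PredictOptions is the request message for the Predict, PredictStream, Embedding, and TokenizeString RPCs. It carries the prompt together with the sampling and runtime options for the request.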

func (*PredictOptions) Descriptor deprecated

func (*PredictOptions) Descriptor() ([]byte, []int)

Deprecated: Use PredictOptions.ProtoReflect.Descriptor instead.

func (*PredictOptions) GetBatch

func (x *PredictOptions) GetBatch() int32

func (*PredictOptions) GetDebug

func (x *PredictOptions) GetDebug() bool

func (*PredictOptions) GetDebugMode

func (x *PredictOptions) GetDebugMode() bool

func (*PredictOptions) GetEmbeddingTokens

func (x *PredictOptions) GetEmbeddingTokens() []int32

func (*PredictOptions) GetEmbeddings

func (x *PredictOptions) GetEmbeddings() string

func (*PredictOptions) GetF16KV

func (x *PredictOptions) GetF16KV() bool

func (*PredictOptions) GetFrequencyPenalty

func (x *PredictOptions) GetFrequencyPenalty() float32

func (*PredictOptions) GetGrammar

func (x *PredictOptions) GetGrammar() string

func (*PredictOptions) GetIgnoreEOS

func (x *PredictOptions) GetIgnoreEOS() bool

func (*PredictOptions) GetLogitBias

func (x *PredictOptions) GetLogitBias() string

func (*PredictOptions) GetMLock

func (x *PredictOptions) GetMLock() bool

func (*PredictOptions) GetMMap

func (x *PredictOptions) GetMMap() bool

func (*PredictOptions) GetMainGPU

func (x *PredictOptions) GetMainGPU() string

func (*PredictOptions) GetMirostat

func (x *PredictOptions) GetMirostat() int32

func (*PredictOptions) GetMirostatETA

func (x *PredictOptions) GetMirostatETA() float32

func (*PredictOptions) GetMirostatTAU

func (x *PredictOptions) GetMirostatTAU() float32

func (*PredictOptions) GetNKeep

func (x *PredictOptions) GetNKeep() int32

func (*PredictOptions) GetNegativePrompt added in v1.23.0

func (x *PredictOptions) GetNegativePrompt() string

func (*PredictOptions) GetNegativePromptScale added in v1.23.0

func (x *PredictOptions) GetNegativePromptScale() float32

func (*PredictOptions) GetPenalizeNL

func (x *PredictOptions) GetPenalizeNL() bool

func (*PredictOptions) GetPenalty

func (x *PredictOptions) GetPenalty() float32

func (*PredictOptions) GetPresencePenalty

func (x *PredictOptions) GetPresencePenalty() float32

func (*PredictOptions) GetPrompt

func (x *PredictOptions) GetPrompt() string

func (*PredictOptions) GetPromptCacheAll

func (x *PredictOptions) GetPromptCacheAll() bool

func (*PredictOptions) GetPromptCachePath

func (x *PredictOptions) GetPromptCachePath() string

func (*PredictOptions) GetPromptCacheRO

func (x *PredictOptions) GetPromptCacheRO() bool

func (*PredictOptions) GetRepeat

func (x *PredictOptions) GetRepeat() int32

func (*PredictOptions) GetRopeFreqBase added in v1.23.0

func (x *PredictOptions) GetRopeFreqBase() float32

func (*PredictOptions) GetRopeFreqScale added in v1.23.0

func (x *PredictOptions) GetRopeFreqScale() float32

func (*PredictOptions) GetSeed

func (x *PredictOptions) GetSeed() int32

func (*PredictOptions) GetStopPrompts

func (x *PredictOptions) GetStopPrompts() []string

func (*PredictOptions) GetTailFreeSamplingZ

func (x *PredictOptions) GetTailFreeSamplingZ() float32

func (*PredictOptions) GetTemperature

func (x *PredictOptions) GetTemperature() float32

func (*PredictOptions) GetTensorSplit

func (x *PredictOptions) GetTensorSplit() string

func (*PredictOptions) GetThreads

func (x *PredictOptions) GetThreads() int32

func (*PredictOptions) GetTokens

func (x *PredictOptions) GetTokens() int32

func (*PredictOptions) GetTopK

func (x *PredictOptions) GetTopK() int32

func (*PredictOptions) GetTopP

func (x *PredictOptions) GetTopP() float32

func (*PredictOptions) GetTypicalP

func (x *PredictOptions) GetTypicalP() float32

func (*PredictOptions) ProtoMessage

func (*PredictOptions) ProtoMessage()

func (*PredictOptions) ProtoReflect

func (x *PredictOptions) ProtoReflect() protoreflect.Message

func (*PredictOptions) Reset

func (x *PredictOptions) Reset()

func (*PredictOptions) String

func (x *PredictOptions) String() string

type Reply

type Reply struct {
	Message []byte `protobuf:"bytes,1,opt,name=message,proto3" json:"message,omitempty"`
	// contains filtered or unexported fields
}

Reply is the response message containing the result; the Message field carries it as raw bytes.

func (*Reply) Descriptor deprecated

func (*Reply) Descriptor() ([]byte, []int)

Deprecated: Use Reply.ProtoReflect.Descriptor instead.

func (*Reply) GetMessage

func (x *Reply) GetMessage() []byte

func (*Reply) ProtoMessage

func (*Reply) ProtoMessage()

func (*Reply) ProtoReflect

func (x *Reply) ProtoReflect() protoreflect.Message

func (*Reply) Reset

func (x *Reply) Reset()

func (*Reply) String

func (x *Reply) String() string

type Result

type Result struct {
	Message string `protobuf:"bytes,1,opt,name=message,proto3" json:"message,omitempty"`
	Success bool   `protobuf:"varint,2,opt,name=success,proto3" json:"success,omitempty"`
	// contains filtered or unexported fields
}

func (*Result) Descriptor deprecated

func (*Result) Descriptor() ([]byte, []int)

Deprecated: Use Result.ProtoReflect.Descriptor instead.

func (*Result) GetMessage

func (x *Result) GetMessage() string

func (*Result) GetSuccess

func (x *Result) GetSuccess() bool

func (*Result) ProtoMessage

func (*Result) ProtoMessage()

func (*Result) ProtoReflect

func (x *Result) ProtoReflect() protoreflect.Message

func (*Result) Reset

func (x *Result) Reset()

func (*Result) String

func (x *Result) String() string

type StatusResponse added in v1.25.0

type StatusResponse struct {
	State  StatusResponse_State `protobuf:"varint,1,opt,name=state,proto3,enum=backend.StatusResponse_State" json:"state,omitempty"`
	Memory *MemoryUsageData     `protobuf:"bytes,2,opt,name=memory,proto3" json:"memory,omitempty"`
	// contains filtered or unexported fields
}

func (*StatusResponse) Descriptor deprecated added in v1.25.0

func (*StatusResponse) Descriptor() ([]byte, []int)

Deprecated: Use StatusResponse.ProtoReflect.Descriptor instead.

func (*StatusResponse) GetMemory added in v1.25.0

func (x *StatusResponse) GetMemory() *MemoryUsageData

func (*StatusResponse) GetState added in v1.25.0

func (x *StatusResponse) GetState() StatusResponse_State

func (*StatusResponse) ProtoMessage added in v1.25.0

func (*StatusResponse) ProtoMessage()

func (*StatusResponse) ProtoReflect added in v1.25.0

func (x *StatusResponse) ProtoReflect() protoreflect.Message

func (*StatusResponse) Reset added in v1.25.0

func (x *StatusResponse) Reset()

func (*StatusResponse) String added in v1.25.0

func (x *StatusResponse) String() string

type StatusResponse_State added in v1.25.0

type StatusResponse_State int32
const (
	StatusResponse_UNINITIALIZED StatusResponse_State = 0
	StatusResponse_BUSY          StatusResponse_State = 1
	StatusResponse_READY         StatusResponse_State = 2
	StatusResponse_ERROR         StatusResponse_State = -1
)

func (StatusResponse_State) Descriptor added in v1.25.0

func (StatusResponse_State) Enum added in v1.25.0

func (StatusResponse_State) EnumDescriptor deprecated added in v1.25.0

func (StatusResponse_State) EnumDescriptor() ([]byte, []int)

Deprecated: Use StatusResponse_State.Descriptor instead.

func (StatusResponse_State) Number added in v1.25.0

func (StatusResponse_State) String added in v1.25.0

func (x StatusResponse_State) String() string

func (StatusResponse_State) Type added in v1.25.0

type TTSRequest

type TTSRequest struct {
	Text  string `protobuf:"bytes,1,opt,name=text,proto3" json:"text,omitempty"`
	Model string `protobuf:"bytes,2,opt,name=model,proto3" json:"model,omitempty"`
	Dst   string `protobuf:"bytes,3,opt,name=dst,proto3" json:"dst,omitempty"`
	// contains filtered or unexported fields
}

func (*TTSRequest) Descriptor deprecated

func (*TTSRequest) Descriptor() ([]byte, []int)

Deprecated: Use TTSRequest.ProtoReflect.Descriptor instead.

func (*TTSRequest) GetDst

func (x *TTSRequest) GetDst() string

func (*TTSRequest) GetModel

func (x *TTSRequest) GetModel() string

func (*TTSRequest) GetText

func (x *TTSRequest) GetText() string

func (*TTSRequest) ProtoMessage

func (*TTSRequest) ProtoMessage()

func (*TTSRequest) ProtoReflect

func (x *TTSRequest) ProtoReflect() protoreflect.Message

func (*TTSRequest) Reset

func (x *TTSRequest) Reset()

func (*TTSRequest) String

func (x *TTSRequest) String() string

type TokenizationResponse added in v1.25.0

type TokenizationResponse struct {
	Length int32   `protobuf:"varint,1,opt,name=length,proto3" json:"length,omitempty"`
	Tokens []int32 `protobuf:"varint,2,rep,packed,name=tokens,proto3" json:"tokens,omitempty"`
	// contains filtered or unexported fields
}

func (*TokenizationResponse) Descriptor deprecated added in v1.25.0

func (*TokenizationResponse) Descriptor() ([]byte, []int)

Deprecated: Use TokenizationResponse.ProtoReflect.Descriptor instead.

func (*TokenizationResponse) GetLength added in v1.25.0

func (x *TokenizationResponse) GetLength() int32

func (*TokenizationResponse) GetTokens added in v1.25.0

func (x *TokenizationResponse) GetTokens() []int32

func (*TokenizationResponse) ProtoMessage added in v1.25.0

func (*TokenizationResponse) ProtoMessage()

func (*TokenizationResponse) ProtoReflect added in v1.25.0

func (x *TokenizationResponse) ProtoReflect() protoreflect.Message

func (*TokenizationResponse) Reset added in v1.25.0

func (x *TokenizationResponse) Reset()

func (*TokenizationResponse) String added in v1.25.0

func (x *TokenizationResponse) String() string

type TranscriptRequest

type TranscriptRequest struct {
	Dst      string `protobuf:"bytes,2,opt,name=dst,proto3" json:"dst,omitempty"`
	Language string `protobuf:"bytes,3,opt,name=language,proto3" json:"language,omitempty"`
	Threads  uint32 `protobuf:"varint,4,opt,name=threads,proto3" json:"threads,omitempty"`
	// contains filtered or unexported fields
}

func (*TranscriptRequest) Descriptor deprecated

func (*TranscriptRequest) Descriptor() ([]byte, []int)

Deprecated: Use TranscriptRequest.ProtoReflect.Descriptor instead.

func (*TranscriptRequest) GetDst

func (x *TranscriptRequest) GetDst() string

func (*TranscriptRequest) GetLanguage

func (x *TranscriptRequest) GetLanguage() string

func (*TranscriptRequest) GetThreads

func (x *TranscriptRequest) GetThreads() uint32

func (*TranscriptRequest) ProtoMessage

func (*TranscriptRequest) ProtoMessage()

func (*TranscriptRequest) ProtoReflect

func (x *TranscriptRequest) ProtoReflect() protoreflect.Message

func (*TranscriptRequest) Reset

func (x *TranscriptRequest) Reset()

func (*TranscriptRequest) String

func (x *TranscriptRequest) String() string

type TranscriptResult

type TranscriptResult struct {
	Segments []*TranscriptSegment `protobuf:"bytes,1,rep,name=segments,proto3" json:"segments,omitempty"`
	Text     string               `protobuf:"bytes,2,opt,name=text,proto3" json:"text,omitempty"`
	// contains filtered or unexported fields
}

func (*TranscriptResult) Descriptor deprecated

func (*TranscriptResult) Descriptor() ([]byte, []int)

Deprecated: Use TranscriptResult.ProtoReflect.Descriptor instead.

func (*TranscriptResult) GetSegments

func (x *TranscriptResult) GetSegments() []*TranscriptSegment

func (*TranscriptResult) GetText

func (x *TranscriptResult) GetText() string

func (*TranscriptResult) ProtoMessage

func (*TranscriptResult) ProtoMessage()

func (*TranscriptResult) ProtoReflect

func (x *TranscriptResult) ProtoReflect() protoreflect.Message

func (*TranscriptResult) Reset

func (x *TranscriptResult) Reset()

func (*TranscriptResult) String

func (x *TranscriptResult) String() string

type TranscriptSegment

type TranscriptSegment struct {
	Id     int32   `protobuf:"varint,1,opt,name=id,proto3" json:"id,omitempty"`
	Start  int64   `protobuf:"varint,2,opt,name=start,proto3" json:"start,omitempty"`
	End    int64   `protobuf:"varint,3,opt,name=end,proto3" json:"end,omitempty"`
	Text   string  `protobuf:"bytes,4,opt,name=text,proto3" json:"text,omitempty"`
	Tokens []int32 `protobuf:"varint,5,rep,packed,name=tokens,proto3" json:"tokens,omitempty"`
	// contains filtered or unexported fields
}

func (*TranscriptSegment) Descriptor deprecated

func (*TranscriptSegment) Descriptor() ([]byte, []int)

Deprecated: Use TranscriptSegment.ProtoReflect.Descriptor instead.

func (*TranscriptSegment) GetEnd

func (x *TranscriptSegment) GetEnd() int64

func (*TranscriptSegment) GetId

func (x *TranscriptSegment) GetId() int32

func (*TranscriptSegment) GetStart

func (x *TranscriptSegment) GetStart() int64

func (*TranscriptSegment) GetText

func (x *TranscriptSegment) GetText() string

func (*TranscriptSegment) GetTokens

func (x *TranscriptSegment) GetTokens() []int32

func (*TranscriptSegment) ProtoMessage

func (*TranscriptSegment) ProtoMessage()

func (*TranscriptSegment) ProtoReflect

func (x *TranscriptSegment) ProtoReflect() protoreflect.Message

func (*TranscriptSegment) Reset

func (x *TranscriptSegment) Reset()

func (*TranscriptSegment) String

func (x *TranscriptSegment) String() string

type UnimplementedBackendServer

type UnimplementedBackendServer struct {
}

UnimplementedBackendServer must be embedded to have forward compatible implementations.

func (UnimplementedBackendServer) AudioTranscription

func (UnimplementedBackendServer) Embedding

func (UnimplementedBackendServer) GenerateImage

func (UnimplementedBackendServer) Health

func (UnimplementedBackendServer) LoadModel

func (UnimplementedBackendServer) Predict

func (UnimplementedBackendServer) PredictStream

func (UnimplementedBackendServer) Status added in v1.25.0

func (UnimplementedBackendServer) TTS

func (UnimplementedBackendServer) TokenizeString added in v1.25.0

type UnsafeBackendServer

type UnsafeBackendServer interface {
	// contains filtered or unexported methods
}

UnsafeBackendServer may be embedded to opt out of forward compatibility for this service. Use of this interface is not recommended, as added methods to BackendServer will result in compilation errors.

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL