Documentation
¶
Index ¶
Constants ¶
This section is empty.
Variables ¶
This section is empty.
Functions ¶
This section is empty.
Types ¶
type AuthConfig ¶
type AuthConfig struct {
// Enable maps to the "enable" YAML key.
// NOTE(review): presumably switches authentication on or off — confirm against the consumer.
Enable bool `yaml:"enable"`
// RBACInternalServerAddr maps to the "rbacInternalServerAddr" YAML key.
// NOTE(review): presumably the address of the internal RBAC server; the expected
// format (e.g. host:port) is not visible here.
RBACInternalServerAddr string `yaml:"rbacInternalServerAddr"`
}
AuthConfig is the authentication configuration.
type Config ¶
type Config struct {
// Port settings. Each field maps to the YAML key named in its tag.
// NOTE(review): which server binds each port is not visible here — confirm against the callers.
GRPCPort int `yaml:"grpcPort"`
HTTPPort int `yaml:"httpPort"`
WorkerServiceGRPCPort int `yaml:"workerServiceGrpcPort"`
MonitoringPort int `yaml:"monitoringPort"`
AdminPort int `yaml:"adminPort"`
InternalGRPCPort int `yaml:"internalGrpcPort"`
ManagementPort int `yaml:"managementPort"`
ManagementGRPCPort int `yaml:"managementGrpcPort"`
// GracefulShutdownDelay is the delay before shutting down the server.
GracefulShutdownDelay time.Duration `yaml:"gracefulShutdownDelay"`
// Addresses of dependent services, as plain strings.
// NOTE(review): presumably host:port endpoints — confirm the expected format.
ModelManagerServerAddr string `yaml:"modelManagerServerAddr"`
VectorStoreManagerServerAddr string `yaml:"vectorStoreManagerServerAddr"`
VectorStoreManagerInternalServerAddr string `yaml:"vectorStoreManagerInternalServerAddr"`
// AuthConfig is the nested authentication configuration; note that its YAML key is "auth".
AuthConfig AuthConfig `yaml:"auth"`
// WorkerServiceTLS is pointer-typed, unlike the other nested configurations.
// NOTE(review): presumably nil means TLS is not configured for the worker service — confirm.
WorkerServiceTLS *TLS `yaml:"workerServiceTls"`
// Nested configurations whose types are declared in other packages or elsewhere in this package.
UsageSender sender.Config `yaml:"usageSender"`
RateLimit rate.Config `yaml:"rateLimit"`
RequestRouting RequestRoutingConfig `yaml:"requestRouting"`
KubernetesManager KubernetesManagerConfig `yaml:"kubernetesManager"`
// GracefulShutdownTimeout is the duration given to runnable to stop
// before the manager actually returns on stop.
GracefulShutdownTimeout time.Duration `yaml:"gracefulShutdownTimeout"`
EngineHeartbeat EngineHeartbeatConfig `yaml:"engineHeartbeat"`
// ServerPodLabelKey is the key of the label that the server pod has.
ServerPodLabelKey string `yaml:"serverPodLabelKey"`
// ServerPodLabelValue is the value of the label that the server pod has for ServerPodLabelKey.
ServerPodLabelValue string `yaml:"serverPodLabelValue"`
Debug DebugConfig `yaml:"debug"`
// NIMModels maps to the "nimModels" YAML key.
// NOTE(review): presumably a list of model identifiers handled as NIM models — confirm.
NIMModels []string `yaml:"nimModels"`
}
Config is the configuration.
type DebugConfig ¶
type DebugConfig struct {
// UseNoopClient maps to the "useNoopClient" YAML key.
// NOTE(review): presumably swaps a real client for a no-op one when debugging;
// which client is affected is not visible here.
UseNoopClient bool `yaml:"useNoopClient"`
}
DebugConfig is the debug configuration.
type EngineHeartbeatConfig ¶ added in v1.27.0
type EngineHeartbeatConfig struct {
// Enable maps to the "enable" YAML key.
// NOTE(review): presumably turns engine heartbeating on or off — confirm.
Enable bool `yaml:"enable"`
// Interval maps to the "interval" YAML key.
// NOTE(review): presumably the period between heartbeats — confirm.
Interval time.Duration `yaml:"interval"`
// Timeout maps to the "timeout" YAML key.
// NOTE(review): presumably how long to wait before an engine is treated as
// unresponsive — confirm against the heartbeat implementation.
Timeout time.Duration `yaml:"timeout"`
}
EngineHeartbeatConfig is the engine heartbeat configuration.
type KubernetesManagerConfig ¶ added in v1.4.0
type KubernetesManagerConfig struct {
// NOTE(review): the field names mirror common Kubernetes controller-manager
// options (leader election, metrics/health/pprof bind addresses), but how they
// are applied is not visible here — confirm against the manager setup code.

// EnableLeaderElection maps to the "enableLeaderElection" YAML key.
EnableLeaderElection bool `yaml:"enableLeaderElection"`
// LeaderElectionID maps to the "leaderElectionID" YAML key.
LeaderElectionID string `yaml:"leaderElectionID"`
// MetricsBindAddress maps to the "metricsBindAddress" YAML key.
MetricsBindAddress string `yaml:"metricsBindAddress"`
// HealthBindAddress maps to the "healthBindAddress" YAML key.
HealthBindAddress string `yaml:"healthBindAddress"`
// PprofBindAddress maps to the "pprofBindAddress" YAML key.
PprofBindAddress string `yaml:"pprofBindAddress"`
}
KubernetesManagerConfig is the Kubernetes manager configuration.
type RequestRoutingConfig ¶ added in v1.6.0
type RequestRoutingConfig struct {
// EnableDynamicModelLoading specifies whether dynamic on-demand model loading is enabled.
// It maps to the "enableDynamicModelLoading" YAML key.
EnableDynamicModelLoading bool `yaml:"enableDynamicModelLoading"`
}
RequestRoutingConfig is the request routing configuration.
Click to show internal directories.
Click to hide internal directories.