Documentation
¶
Overview ¶
Package v1alpha1 contains API Schema definitions for the inference v1alpha1 API group +kubebuilder:object:generate=true +groupName=inference.llmaz.io
Index ¶
- Constants
- Variables
- func Resource(resource string) schema.GroupResource
- type BackendName
- type BackendRuntime
- type BackendRuntimeArg
- type BackendRuntimeConfig
- type BackendRuntimeList
- type BackendRuntimeSpec
- type BackendRuntimeStatus
- type ElasticConfig
- type HPATrigger
- type MultiHostCommands
- type NamedScaleTrigger
- type Playground
- type PlaygroundList
- type PlaygroundSpec
- type PlaygroundStatus
- type ResourceRequirements
- type ScaleTrigger
- type ScaleTriggerRef
- type Service
- type ServiceList
- type ServiceSpec
- type ServiceStatus
Constants ¶
const ( // PlaygroundProgressing means the Playground is progressing now, such as waiting for the // inference service creation, rolling update or scaling up and down. PlaygroundProgressing = "Progressing" // PlaygroundAvailable indicates the corresponding inference service is available now. PlaygroundAvailable string = "Available" )
const ( // ServiceAvailable means the inferenceService is available and all the // workloads are running as expected. ServiceAvailable = "Available" // ServiceProgressing means the inferenceService is progressing now, such as // in creation, rolling update or scaling up and down. ServiceProgressing = "Progressing" )
const ( // InferenceServiceFlavorsAnnoKey is the annotation key for the flavors specified // in the inference service, the value is a comma-separated list of flavor names. InferenceServiceFlavorsAnnoKey = "llmaz.io/inference-service-flavors" )
Variables ¶
var ( // GroupVersion is group version used to register these objects GroupVersion = schema.GroupVersion{Group: "inference.llmaz.io", Version: "v1alpha1"} // SchemeGroupVersion is alias to GroupVersion for client-go libraries. // It is required by pkg/client/informers/externalversions/... SchemeGroupVersion = GroupVersion // SchemeBuilder is used to add go types to the GroupVersionKind scheme SchemeBuilder = &scheme.Builder{GroupVersion: GroupVersion} // AddToScheme adds the types in this group-version to the given scheme. AddToScheme = SchemeBuilder.AddToScheme )
Functions ¶
func Resource ¶
func Resource(resource string) schema.GroupResource
Resource is required by pkg/client/listers/...
Types ¶
type BackendRuntime ¶ added in v0.0.7
type BackendRuntime struct {
metav1.TypeMeta `json:",inline"`
metav1.ObjectMeta `json:"metadata,omitempty"`
Spec BackendRuntimeSpec `json:"spec,omitempty"`
Status BackendRuntimeStatus `json:"status,omitempty"`
}
BackendRuntime is the Schema for the backendRuntime API
func (*BackendRuntime) DeepCopy ¶ added in v0.0.7
func (in *BackendRuntime) DeepCopy() *BackendRuntime
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new BackendRuntime.
func (*BackendRuntime) DeepCopyInto ¶ added in v0.0.7
func (in *BackendRuntime) DeepCopyInto(out *BackendRuntime)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
func (*BackendRuntime) DeepCopyObject ¶ added in v0.0.7
func (in *BackendRuntime) DeepCopyObject() runtime.Object
DeepCopyObject is an autogenerated deepcopy function, copying the receiver, creating a new runtime.Object.
type BackendRuntimeArg ¶ added in v0.0.7
type BackendRuntimeArg struct {
// Name represents the identifier of the backendRuntime argument.
// +kubebuilder:default=default
// +optional
Name *string `json:"name,omitempty"`
// Flags represents all the preset configurations.
// A flag written as {{ .CONFIG }} is a configuration waiting to be rendered.
Flags []string `json:"flags,omitempty"`
}
BackendRuntimeArg is a set of preset arguments for ease of use. Three preset names are provided: default, speculative-decoding, and model-parallelism; do not change these names.
func (*BackendRuntimeArg) DeepCopy ¶ added in v0.0.7
func (in *BackendRuntimeArg) DeepCopy() *BackendRuntimeArg
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new BackendRuntimeArg.
func (*BackendRuntimeArg) DeepCopyInto ¶ added in v0.0.7
func (in *BackendRuntimeArg) DeepCopyInto(out *BackendRuntimeArg)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type BackendRuntimeConfig ¶ added in v0.0.7
type BackendRuntimeConfig struct {
// Name represents the inference backend under the hood, e.g. vLLM.
// +kubebuilder:default=vllm
// +optional
Name *BackendName `json:"name,omitempty"`
// Version represents the backend version if you want a different one
// from the default version.
// +optional
Version *string `json:"version,omitempty"`
// Args represents the specified arguments of the backendRuntime,
// which will be appended to the backendRuntime.spec.Args.
Args *BackendRuntimeArg `json:"args,omitempty"`
// Envs represents the environments set to the container.
// +optional
Envs []corev1.EnvVar `json:"envs,omitempty"`
// Resources represents the resource requirements for backend, like cpu/mem,
// accelerators like GPU should not be defined here, but at the model flavors,
// or the values here will be overwritten.
Resources *ResourceRequirements `json:"resources,omitempty"`
}
func (*BackendRuntimeConfig) DeepCopy ¶ added in v0.0.7
func (in *BackendRuntimeConfig) DeepCopy() *BackendRuntimeConfig
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new BackendRuntimeConfig.
func (*BackendRuntimeConfig) DeepCopyInto ¶ added in v0.0.7
func (in *BackendRuntimeConfig) DeepCopyInto(out *BackendRuntimeConfig)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type BackendRuntimeList ¶ added in v0.0.7
type BackendRuntimeList struct {
metav1.TypeMeta `json:",inline"`
metav1.ListMeta `json:"metadata,omitempty"`
Items []BackendRuntime `json:"items"`
}
BackendRuntimeList contains a list of BackendRuntime
func (*BackendRuntimeList) DeepCopy ¶ added in v0.0.7
func (in *BackendRuntimeList) DeepCopy() *BackendRuntimeList
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new BackendRuntimeList.
func (*BackendRuntimeList) DeepCopyInto ¶ added in v0.0.7
func (in *BackendRuntimeList) DeepCopyInto(out *BackendRuntimeList)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
func (*BackendRuntimeList) DeepCopyObject ¶ added in v0.0.7
func (in *BackendRuntimeList) DeepCopyObject() runtime.Object
DeepCopyObject is an autogenerated deepcopy function, copying the receiver, creating a new runtime.Object.
type BackendRuntimeSpec ¶ added in v0.0.7
type BackendRuntimeSpec struct {
// Commands represents the default commands for the backendRuntime.
// +optional
Commands []string `json:"commands,omitempty"`
// MultiHostCommands represents leader and worker commands for nodes with
// different roles.
// +optional
MultiHostCommands *MultiHostCommands `json:"multiHostCommands,omitempty"`
// Image represents the default image registry of the backendRuntime.
// It will work together with version to make up a real image.
Image string `json:"image"`
// Version represents the default version of the backendRuntime.
// It will be appended to the image as a tag.
Version string `json:"version"`
// Args represents the preset arguments of the backendRuntime.
// They can be appended or overwritten by the Playground backendRuntimeConfig.
Args []BackendRuntimeArg `json:"args,omitempty"`
// Envs represents the environments set to the container.
// +optional
Envs []corev1.EnvVar `json:"envs,omitempty"`
// Resources represents the resource requirements for backendRuntime, like cpu/mem,
// accelerators like GPU should not be defined here, but at the model flavors,
// or the values here will be overwritten.
Resources ResourceRequirements `json:"resources"`
// Periodic probe of backend liveness.
// Backend will be restarted if the probe fails.
// Cannot be updated.
// +optional
LivenessProbe *corev1.Probe `json:"livenessProbe,omitempty"`
// Periodic probe of backend readiness.
// Backend will be removed from service endpoints if the probe fails.
// +optional
ReadinessProbe *corev1.Probe `json:"readinessProbe,omitempty"`
// StartupProbe indicates that the Backend has successfully initialized.
// If specified, no other probes are executed until this completes successfully.
// If this probe fails, the backend will be restarted, just as if the livenessProbe failed.
// This can be used to provide different probe parameters at the beginning of a backend's lifecycle,
// when it might take a long time to load data or warm a cache, than during steady-state operation.
// +optional
StartupProbe *corev1.Probe `json:"startupProbe,omitempty"`
// ScaleTriggers represents a set of triggers preset to be used by Playground.
// If the Playground does not specify a scale trigger, the trigger at index 0 will be used.
// +optional
ScaleTriggers []NamedScaleTrigger `json:"scaleTriggers,omitempty"`
}
BackendRuntimeSpec defines the desired state of BackendRuntime
func (*BackendRuntimeSpec) DeepCopy ¶ added in v0.0.7
func (in *BackendRuntimeSpec) DeepCopy() *BackendRuntimeSpec
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new BackendRuntimeSpec.
func (*BackendRuntimeSpec) DeepCopyInto ¶ added in v0.0.7
func (in *BackendRuntimeSpec) DeepCopyInto(out *BackendRuntimeSpec)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type BackendRuntimeStatus ¶ added in v0.0.7
type BackendRuntimeStatus struct {
// Conditions represents the Inference condition.
Conditions []metav1.Condition `json:"conditions,omitempty"`
}
BackendRuntimeStatus defines the observed state of BackendRuntime
func (*BackendRuntimeStatus) DeepCopy ¶ added in v0.0.7
func (in *BackendRuntimeStatus) DeepCopy() *BackendRuntimeStatus
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new BackendRuntimeStatus.
func (*BackendRuntimeStatus) DeepCopyInto ¶ added in v0.0.7
func (in *BackendRuntimeStatus) DeepCopyInto(out *BackendRuntimeStatus)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type ElasticConfig ¶
type ElasticConfig struct {
// MinReplicas indicates the minimum number of inference workloads based on the traffic.
// Default to 1.
// MinReplicas can't be 0 for now; serverless will be supported in the future.
// +kubebuilder:default=1
// +optional
MinReplicas *int32 `json:"minReplicas,omitempty"`
// MaxReplicas indicates the maximum number of inference workloads based on the traffic.
// Defaults to nil, which means there's no limit on the number of instances.
// +optional
MaxReplicas *int32 `json:"maxReplicas,omitempty"`
// ScaleTriggerRef refers to the configured scaleTrigger in the backendRuntime
// with tuned target value.
// ScaleTriggerRef and ScaleTrigger can't be set at the same time.
// +optional
ScaleTriggerRef *ScaleTriggerRef `json:"scaleTriggerRef,omitempty"`
// ScaleTrigger defines a set of triggers to scale the workloads.
// If not defined, trigger configured in backendRuntime will be used,
// otherwise, trigger defined here will overwrite the defaulted ones.
// ScaleTriggerRef and ScaleTrigger can't be set at the same time.
// +optional
ScaleTrigger *ScaleTrigger `json:"scaleTrigger,omitempty"`
}
func (*ElasticConfig) DeepCopy ¶
func (in *ElasticConfig) DeepCopy() *ElasticConfig
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new ElasticConfig.
func (*ElasticConfig) DeepCopyInto ¶
func (in *ElasticConfig) DeepCopyInto(out *ElasticConfig)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type HPATrigger ¶ added in v0.1.0
type HPATrigger struct {
// metrics contains the specifications for which to use to calculate the
// desired replica count (the maximum replica count across all metrics will
// be used). The desired replica count is calculated multiplying the
// ratio between the target value and the current value by the current
// number of pods. Ergo, metrics used must decrease as the pod count is
// increased, and vice-versa. See the individual metric source types for
// more information about how each type of metric must respond.
// +optional
Metrics []autoscalingv2.MetricSpec `json:"metrics,omitempty"`
// behavior configures the scaling behavior of the target
// in both Up and Down directions (scaleUp and scaleDown fields respectively).
// If not set, the default HPAScalingRules for scale up and scale down are used.
// +optional
Behavior *autoscalingv2.HorizontalPodAutoscalerBehavior `json:"behavior,omitempty"`
}
HPATrigger represents the configuration of the HorizontalPodAutoscaler. Inspired by kubernetes.io/pkg/apis/autoscaling/types.go#HorizontalPodAutoscalerSpec. Note: the HPA component should be installed beforehand.
func (*HPATrigger) DeepCopy ¶ added in v0.1.0
func (in *HPATrigger) DeepCopy() *HPATrigger
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new HPATrigger.
func (*HPATrigger) DeepCopyInto ¶ added in v0.1.0
func (in *HPATrigger) DeepCopyInto(out *HPATrigger)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type MultiHostCommands ¶ added in v0.1.0
type MultiHostCommands struct {
Leader []string `json:"leader,omitempty"`
Worker []string `json:"worker,omitempty"`
}
MultiHostCommands represents leader & worker commands for multiple nodes scenarios.
func (*MultiHostCommands) DeepCopy ¶ added in v0.1.0
func (in *MultiHostCommands) DeepCopy() *MultiHostCommands
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new MultiHostCommands.
func (*MultiHostCommands) DeepCopyInto ¶ added in v0.1.0
func (in *MultiHostCommands) DeepCopyInto(out *MultiHostCommands)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type NamedScaleTrigger ¶ added in v0.1.0
type NamedScaleTrigger struct {
// Name represents the identifier of the scale trigger, e.g. some triggers defined for
// latency sensitive workloads, some are defined for throughput sensitive workloads.
Name string `json:"name,omitempty"`
// HPA represents the trigger configuration of the HorizontalPodAutoscaler.
HPA *HPATrigger `json:"hpa,omitempty"`
}
NamedScaleTrigger defines the rules to scale the workloads. Only one trigger could work at a time. The name is used to identify the trigger in backendRuntime.
func (*NamedScaleTrigger) DeepCopy ¶ added in v0.1.0
func (in *NamedScaleTrigger) DeepCopy() *NamedScaleTrigger
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new NamedScaleTrigger.
func (*NamedScaleTrigger) DeepCopyInto ¶ added in v0.1.0
func (in *NamedScaleTrigger) DeepCopyInto(out *NamedScaleTrigger)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type Playground ¶
type Playground struct {
metav1.TypeMeta `json:",inline"`
metav1.ObjectMeta `json:"metadata,omitempty"`
Spec PlaygroundSpec `json:"spec,omitempty"`
Status PlaygroundStatus `json:"status,omitempty"`
}
Playground is the Schema for the playgrounds API
func (*Playground) DeepCopy ¶
func (in *Playground) DeepCopy() *Playground
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new Playground.
func (*Playground) DeepCopyInto ¶
func (in *Playground) DeepCopyInto(out *Playground)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
func (*Playground) DeepCopyObject ¶
func (in *Playground) DeepCopyObject() runtime.Object
DeepCopyObject is an autogenerated deepcopy function, copying the receiver, creating a new runtime.Object.
type PlaygroundList ¶
type PlaygroundList struct {
metav1.TypeMeta `json:",inline"`
metav1.ListMeta `json:"metadata,omitempty"`
Items []Playground `json:"items"`
}
PlaygroundList contains a list of Playground
func (*PlaygroundList) DeepCopy ¶
func (in *PlaygroundList) DeepCopy() *PlaygroundList
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new PlaygroundList.
func (*PlaygroundList) DeepCopyInto ¶
func (in *PlaygroundList) DeepCopyInto(out *PlaygroundList)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
func (*PlaygroundList) DeepCopyObject ¶
func (in *PlaygroundList) DeepCopyObject() runtime.Object
DeepCopyObject is an autogenerated deepcopy function, copying the receiver, creating a new runtime.Object.
type PlaygroundSpec ¶
type PlaygroundSpec struct {
// Replicas represents the replica number of inference workloads.
// +kubebuilder:default=1
// +optional
Replicas *int32 `json:"replicas,omitempty"`
// ModelClaim represents claiming for one model, it's a simplified use case
// of modelClaims. Most of the time, modelClaim is enough.
// ModelClaim and modelClaims are mutually exclusive.
// +optional
ModelClaim *coreapi.ModelClaim `json:"modelClaim,omitempty"`
// ModelClaims represents claiming for multiple models for more complicated
// use cases like speculative-decoding.
// ModelClaims and modelClaim are mutually exclusive.
// +optional
ModelClaims *coreapi.ModelClaims `json:"modelClaims,omitempty"`
// BackendRuntimeConfig represents the inference backendRuntime configuration
// under the hood, e.g. vLLM, which is the default backendRuntime.
// +optional
BackendRuntimeConfig *BackendRuntimeConfig `json:"backendRuntimeConfig,omitempty"`
// ElasticConfig defines the configuration for elastic usage,
// e.g. the max/min replicas.
// Note: this requires the HPA to be installed first; otherwise an error will be reported.
// +optional
ElasticConfig *ElasticConfig `json:"elasticConfig,omitempty"`
}
PlaygroundSpec defines the desired state of Playground
func (*PlaygroundSpec) DeepCopy ¶
func (in *PlaygroundSpec) DeepCopy() *PlaygroundSpec
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new PlaygroundSpec.
func (*PlaygroundSpec) DeepCopyInto ¶
func (in *PlaygroundSpec) DeepCopyInto(out *PlaygroundSpec)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type PlaygroundStatus ¶
type PlaygroundStatus struct {
// Conditions represents the Inference condition.
Conditions []metav1.Condition `json:"conditions,omitempty"`
// Replicas track the replicas that have been created, whether ready or not.
Replicas int32 `json:"replicas"`
// Selector points to the string form of a label selector which will be used by HPA.
Selector string `json:"selector,omitempty"`
}
PlaygroundStatus defines the observed state of Playground
func (*PlaygroundStatus) DeepCopy ¶
func (in *PlaygroundStatus) DeepCopy() *PlaygroundStatus
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new PlaygroundStatus.
func (*PlaygroundStatus) DeepCopyInto ¶
func (in *PlaygroundStatus) DeepCopyInto(out *PlaygroundStatus)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type ResourceRequirements ¶
type ResourceRequirements struct {
// Limits describes the maximum amount of compute resources allowed.
// More info: https://kubernetes.io/docs/concepts/configuration/manage-resources-containers/
// +optional
Limits corev1.ResourceList `json:"limits,omitempty"`
// Requests describes the minimum amount of compute resources required.
// If Requests is omitted for a container, it defaults to Limits if that is explicitly specified,
// otherwise to an implementation-defined value. Requests cannot exceed Limits.
// More info: https://kubernetes.io/docs/concepts/configuration/manage-resources-containers/
// +optional
Requests corev1.ResourceList `json:"requests,omitempty"`
}
TODO: DRA is not supported yet; we can add support once needed.
func (*ResourceRequirements) DeepCopy ¶
func (in *ResourceRequirements) DeepCopy() *ResourceRequirements
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new ResourceRequirements.
func (*ResourceRequirements) DeepCopyInto ¶
func (in *ResourceRequirements) DeepCopyInto(out *ResourceRequirements)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type ScaleTrigger ¶ added in v0.1.0
type ScaleTrigger struct {
// HPA represents the trigger configuration of the HorizontalPodAutoscaler.
HPA *HPATrigger `json:"hpa,omitempty"`
}
ScaleTrigger defines the rules to scale the workloads. Only one trigger could work at a time, mostly used in Playground.
func (*ScaleTrigger) DeepCopy ¶ added in v0.1.0
func (in *ScaleTrigger) DeepCopy() *ScaleTrigger
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new ScaleTrigger.
func (*ScaleTrigger) DeepCopyInto ¶ added in v0.1.0
func (in *ScaleTrigger) DeepCopyInto(out *ScaleTrigger)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type ScaleTriggerRef ¶ added in v0.1.0
type ScaleTriggerRef struct {
// Name represents the scale trigger name defined in the backendRuntime.scaleTriggers.
Name string `json:"name"`
}
ScaleTriggerRef refers to the configured scaleTrigger in the backendRuntime.
func (*ScaleTriggerRef) DeepCopy ¶ added in v0.1.0
func (in *ScaleTriggerRef) DeepCopy() *ScaleTriggerRef
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new ScaleTriggerRef.
func (*ScaleTriggerRef) DeepCopyInto ¶ added in v0.1.0
func (in *ScaleTriggerRef) DeepCopyInto(out *ScaleTriggerRef)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type Service ¶
type Service struct {
metav1.TypeMeta `json:",inline"`
metav1.ObjectMeta `json:"metadata,omitempty"`
Spec ServiceSpec `json:"spec,omitempty"`
Status ServiceStatus `json:"status,omitempty"`
}
Service is the Schema for the services API
func (*Service) DeepCopy ¶
func (in *Service) DeepCopy() *Service
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new Service.
func (*Service) DeepCopyInto ¶
func (in *Service) DeepCopyInto(out *Service)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
func (*Service) DeepCopyObject ¶
func (in *Service) DeepCopyObject() runtime.Object
DeepCopyObject is an autogenerated deepcopy function, copying the receiver, creating a new runtime.Object.
type ServiceList ¶
type ServiceList struct {
metav1.TypeMeta `json:",inline"`
metav1.ListMeta `json:"metadata,omitempty"`
Items []Service `json:"items"`
}
ServiceList contains a list of Service
func (*ServiceList) DeepCopy ¶
func (in *ServiceList) DeepCopy() *ServiceList
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new ServiceList.
func (*ServiceList) DeepCopyInto ¶
func (in *ServiceList) DeepCopyInto(out *ServiceList)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
func (*ServiceList) DeepCopyObject ¶
func (in *ServiceList) DeepCopyObject() runtime.Object
DeepCopyObject is an autogenerated deepcopy function, copying the receiver, creating a new runtime.Object.
type ServiceSpec ¶
type ServiceSpec struct {
// ModelClaims represents multiple claims for different models.
ModelClaims coreapi.ModelClaims `json:"modelClaims,omitempty"`
// WorkloadTemplate defines the underlying workload layout and configuration.
// Note: the LWS spec might be twisted with various LWS instances to support
// accelerator fungibility or other cutting-edge research.
// LWS supports both single-host and multi-host scenarios, for single host
// cases, only need to care about replicas, rolloutStrategy and workerTemplate.
WorkloadTemplate lws.LeaderWorkerSetSpec `json:"workloadTemplate"`
}
ServiceSpec defines the desired state of Service. Service controller will maintain multi-flavor of workloads with different accelerators for cost or performance considerations.
func (*ServiceSpec) DeepCopy ¶
func (in *ServiceSpec) DeepCopy() *ServiceSpec
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new ServiceSpec.
func (*ServiceSpec) DeepCopyInto ¶
func (in *ServiceSpec) DeepCopyInto(out *ServiceSpec)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.
type ServiceStatus ¶
type ServiceStatus struct {
// Conditions represents the Inference condition.
Conditions []metav1.Condition `json:"conditions,omitempty"`
// Replicas track the replicas that have been created, whether ready or not.
Replicas int32 `json:"replicas"`
// Selector points to the string form of a label selector, which the HPA uses
// to autoscale your resource.
Selector string `json:"selector,omitempty"`
}
ServiceStatus defines the observed state of Service
func (*ServiceStatus) DeepCopy ¶
func (in *ServiceStatus) DeepCopy() *ServiceStatus
DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new ServiceStatus.
func (*ServiceStatus) DeepCopyInto ¶
func (in *ServiceStatus) DeepCopyInto(out *ServiceStatus)
DeepCopyInto is an autogenerated deepcopy function, copying the receiver, writing into out. in must be non-nil.