Documentation ¶
Index ¶
- Constants
- Variables
- func Init()
- func NewLeastBusyTimeRouter() (types.Router, error)
- func NewLeastExpectedLatencyRouter() (types.Router, error)
- func NewLeastKvCacheRouter() (types.Router, error)
- func NewLeastRequestRouter() (types.Router, error)
- func NewPrefixCacheAndLoadRouter() (types.Router, error)
- func NewPrefixCacheRouter() (types.Router, error)
- func NewRandomRouter() (types.Router, error)
- func NewThroughputRouter() (types.Router, error)
- func Register(algorithm types.RoutingAlgorithm, provider types.RouterProviderFunc)
- func RegisterDelayed(algorithm types.RoutingAlgorithm, delayedProvider types.RouterProviderRegistrationFunc)
- func RegisterDelayedConstructor(algorithm types.RoutingAlgorithm, routerConstructor types.RouterConstructor)
- func Select(algorithms types.RoutingAlgorithm) types.RouterProviderFunc
- func SelectRandomPodAsFallback(ctx *types.RoutingContext, pods []*v1.Pod, randomFunc func(int) int) (*v1.Pod, error)
- func Validate(algorithms string) (types.RoutingAlgorithm, bool)
- type PrefillTimeParams
- type SlidingWindowHistogram
Constants ¶
View Source
const (
RouterNotSet = ""
)
Variables ¶
View Source
var (
RouterLeastBusyTime types.RoutingAlgorithm = "least-busy-time"
)
View Source
var (
RouterLeastKvCache types.RoutingAlgorithm = "least-kv-cache"
)
View Source
var (
RouterLeastLatency types.RoutingAlgorithm = "least-latency"
)
View Source
var (
RouterLeastRequest types.RoutingAlgorithm = "least-request"
)
View Source
var (
RouterPrefixCache types.RoutingAlgorithm = "prefix-cache"
)
View Source
var (
RouterPrefixCacheAndLoad types.RoutingAlgorithm = "prefix-cache-preble"
)
View Source
var (
RouterRandom types.RoutingAlgorithm = "random"
)
View Source
var (
RouterThroughput types.RoutingAlgorithm = "throughput"
)
Functions ¶
func NewLeastBusyTimeRouter ¶
func NewLeastKvCacheRouter ¶
func NewLeastRequestRouter ¶
func NewPrefixCacheRouter ¶
func NewRandomRouter ¶
func NewThroughputRouter ¶
func Register ¶
func Register(algorithm types.RoutingAlgorithm, provider types.RouterProviderFunc)
func RegisterDelayed ¶
func RegisterDelayed(algorithm types.RoutingAlgorithm, delayedProvider types.RouterProviderRegistrationFunc)
func RegisterDelayedConstructor ¶
func RegisterDelayedConstructor(algorithm types.RoutingAlgorithm, routerConstructor types.RouterConstructor)
func Select ¶
func Select(algorithms types.RoutingAlgorithm) types.RouterProviderFunc
Select returns the user-provided router provider supported by the gateway. No error is reported; it falls back to the random router. Call Validate before this function to ensure expected behavior.
func SelectRandomPodAsFallback ¶
func SelectRandomPodAsFallback(ctx *types.RoutingContext, pods []*v1.Pod, randomFunc func(int) int) (*v1.Pod, error)
SelectRandomPodAsFallback selects a pod randomly as a fallback. This function should only be used when all other selection mechanisms have failed. For example, if no pods meet the required criteria (e.g., valid metrics or specific conditions), it can be called to randomly select a pod from the provided list.
Types ¶
type PrefillTimeParams ¶
type SlidingWindowHistogram ¶
type SlidingWindowHistogram struct {
// contains filtered or unexported fields
}
Source Files ¶
Click to show internal directories.
Click to hide internal directories.