@@ -21,16 +21,15 @@ import (
2121 metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
2222)
2323
24- type InferenceMode string
25-
26- const (
27- DefaultInferenceMode InferenceMode = "Default"
28- SpeculativeDecodingInferenceMode InferenceMode = "SpeculativeDecoding"
29- )
30-
24+ // BackendRuntimeArg is a preset group of arguments provided for ease of use.
25+ // Do not rename a preset unless the argument name is set explicitly
26+ // in the Playground backendRuntimeConfig.
3127type BackendRuntimeArg struct {
32- Mode InferenceMode `json:"mode"`
33- Flags []string `json:"flags,omitempty"`
28+ // Name represents the identifier of the backendRuntime argument.
29+ Name string `json:"name"`
30+ // Flags represents all the preset configurations.
31+ // A flag wrapped in {{ .CONFIG }} is a configuration waiting to be rendered.
32+ Flags []string `json:"flags,omitempty"`
3433}
3534
3635// BackendRuntimeSpec defines the desired state of BackendRuntime
@@ -43,11 +42,8 @@ type BackendRuntimeSpec struct {
4342 // Version represents the default version of the backendRuntime.
4443 // It will be appended to the image as a tag.
4544 Version string `json:"version"`
46- // Args represents the args of the backendRuntime.
47- // They can be appended or overwritten by the Playground args.
48- // The key is the inference option, like default one or advanced
49- // speculativeDecoding, the values are the corresponding args.
50- // Flag around with {{ .XXX }} is a flag waiting for render.
45+ // Args represents the preset arguments of the backendRuntime.
46+ // They can be appended or overwritten by the Playground backendRuntimeConfig.
5147 Args []BackendRuntimeArg `json:"args,omitempty"`
5248 // Envs represents the environments set to the container.
5349 // +optional
0 commit comments