@@ -21,16 +21,15 @@ import (
21
21
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
22
22
)
23
23
24
- type InferenceMode string
25
-
26
- const (
27
- DefaultInferenceMode InferenceMode = "Default"
28
- SpeculativeDecodingInferenceMode InferenceMode = "SpeculativeDecoding"
29
- )
30
-
24
+ // BackendRuntimeArg is a set of preset arguments provided for ease of use.
25
+ // Do not edit the preset names unless the argument name is set explicitly
26
+ // in Playground backendRuntimeConfig.
31
27
type BackendRuntimeArg struct {
32
- Mode InferenceMode `json:"mode"`
33
- Flags []string `json:"flags,omitempty"`
28
+ // Name represents the identifier of the backendRuntime argument.
29
+ Name string `json:"name"`
30
+ // Flags represents all the preset configurations.
31
+ // A flag of the form {{ .CONFIG }} is a configuration placeholder waiting to be rendered.
32
+ Flags []string `json:"flags,omitempty"`
34
33
}
35
34
36
35
// BackendRuntimeSpec defines the desired state of BackendRuntime
@@ -43,11 +42,8 @@ type BackendRuntimeSpec struct {
43
42
// Version represents the default version of the backendRuntime.
44
43
// It will be appended to the image as a tag.
45
44
Version string `json:"version"`
46
- // Args represents the args of the backendRuntime.
47
- // They can be appended or overwritten by the Playground args.
48
- // The key is the inference option, like default one or advanced
49
- // speculativeDecoding, the values are the corresponding args.
50
- // Flag around with {{ .XXX }} is a flag waiting for render.
45
+ // Args represents the preset arguments of the backendRuntime.
46
+ // They can be appended or overwritten by the Playground backendRuntimeConfig.
51
47
Args []BackendRuntimeArg `json:"args,omitempty"`
52
48
// Envs represents the environments set to the container.
53
49
// +optional
0 commit comments