File tree Expand file tree Collapse file tree 4 files changed +11
-6
lines changed
config/charts/inferencepool Expand file tree Collapse file tree 4 files changed +11
-6
lines changed Original file line number Diff line number Diff line change @@ -348,6 +348,8 @@ func (r *Runner) parsePluginsConfiguration(ctx context.Context) error {
348
348
return fmt .Errorf ("failed to load the configuration - %w" , err )
349
349
}
350
350
351
+ setupLog.Info("Configuration file loaded", "config", config)
352
+
351
353
r .schedulerConfig , err = loader .LoadSchedulerConfig (config .SchedulingProfiles , handle )
352
354
if err != nil {
353
355
return fmt .Errorf ("failed to create Scheduler configuration - %w" , err )
Original file line number Diff line number Diff line change 79
79
- pluginRef: prefix-cache-scorer
80
80
weight: 1
81
81
- pluginRef: max-score-picker
82
- {{- if (hasKey .Values.inferenceExtension "additionalConfigs ") }}
83
- {{- .Values.inferenceExtension.additionalConfigs | toYaml | nindent 2 }}
82
+ {{- if (hasKey .Values.inferenceExtension "pluginsCustomConfig") }}
83
+ {{- .Values.inferenceExtension.pluginsCustomConfig | toYaml | nindent 2 }}
84
84
{{- end }}
85
85
Original file line number Diff line number Diff line change 36
36
- -metricsPort
37
37
- " 9090"
38
38
- -configFile
39
- - {{ .Values.inferenceExtension.configFile }}
39
- "config/{{ .Values.inferenceExtension.pluginsConfigFile }}"
40
40
# https://pkg.go.dev/flag#hdr-Command_line_flag_syntax; space is only for non-bool flags
41
41
- " -enablePprof={{ .Values.inferenceExtension.enablePprof }}"
42
42
{{- if eq (.Values.inferencePool.modelServerType | default "vllm") "triton-tensorrt-llm" }}
Original file line number Diff line number Diff line change @@ -8,9 +8,10 @@ inferenceExtension:
8
8
extProcPort : 9002
9
9
env : {}
10
10
enablePprof : true # Enable pprof handlers for profiling and debugging
11
- configFile : " /config/default-plugins.yaml"
12
- # additionalConfigs:
13
- # custom-config.yaml: |
11
+ # Name of the plugins configuration file passed to the -configFile flag.
12
+ pluginsConfigFile: "default-plugins.yaml"
13
+ # pluginsCustomConfig:
14
+ # custom-plugins.yaml: |
14
15
# apiVersion: inference.networking.x-k8s.io/v1alpha1
15
16
# kind: EndpointPickerConfig
16
17
# plugins:
@@ -23,7 +24,9 @@ inferenceExtension:
23
24
# - name: default
24
25
# plugins:
25
26
# - pluginRef: custom-scorer
27
+ # weight: 1
26
28
# - pluginRef: max-score-picker
29
+ # weight: 1
27
30
28
31
# Example environment variables:
29
32
# env:
You can’t perform that action at this time.
0 commit comments