@@ -103,7 +103,7 @@ func TestGetArgs(t *testing.T) {
103103 },
104104 },
105105 {
106- name : "with model context size ( takes precedence) " ,
106+ name : "backend config takes precedence over model config " ,
107107 bundle : & mockModelBundle {
108108 safetensorsPath : "/path/to/model/model.safetensors" ,
109109 runtimeConfig : & types.Config {
@@ -114,6 +114,29 @@ func TestGetArgs(t *testing.T) {
114114 config : & inference.BackendConfiguration {
115115 ContextSize : int32ptr (8192 ),
116116 },
117+ expected : []string {
118+ "-m" ,
119+ "sglang.launch_server" ,
120+ "--model-path" ,
121+ "/path/to/model" ,
122+ "--host" ,
123+ "127.0.0.1" ,
124+ "--port" ,
125+ "30000" ,
126+ "--context-length" ,
127+ "8192" ,
128+ },
129+ },
130+ {
131+ name : "model config used when no backend config" ,
132+ bundle : & mockModelBundle {
133+ safetensorsPath : "/path/to/model/model.safetensors" ,
134+ runtimeConfig : & types.Config {
135+ ContextSize : int32ptr (16384 ),
136+ },
137+ },
138+ mode : inference .BackendModeCompletion ,
139+ config : nil ,
117140 expected : []string {
118141 "-m" ,
119142 "sglang.launch_server" ,
@@ -225,14 +248,14 @@ func TestGetContextLength(t *testing.T) {
225248 expectedValue : int32ptr (8192 ),
226249 },
227250 {
228- name : "model config takes precedence" ,
251+ name : "backend config takes precedence" ,
229252 modelCfg : & types.Config {
230253 ContextSize : int32ptr (16384 ),
231254 },
232255 backendCfg : & inference.BackendConfiguration {
233256 ContextSize : int32ptr (4096 ),
234257 },
235- expectedValue : int32ptr (16384 ),
258+ expectedValue : int32ptr (4096 ),
236259 },
237260 {
238261 name : "zero context size in backend config returns nil" ,
0 commit comments