Skip to content

Commit 5f75e6f

Browse files
committed
Trying to save space
tiny is not so tiny, it's 600M

Signed-off-by: Eric Curtin <[email protected]>
1 parent 1af46a2 commit 5f75e6f

File tree

1 file changed

+20
-17
lines changed

1 file changed

+20
-17
lines changed

test/system/040-serve.bats

Lines changed: 20 additions & 17 deletions
Original file line number | Diff line number | Diff line change
@@ -178,25 +178,27 @@ verify_begin=".*run --rm"
178178
}
179179

180180
@test "ramalama serve --generate=quadlet" {
181-
model=tiny
181+
model="smollm"
182+
model_quant="$model:135m"
183+
quadlet="$model.container"
182184
name=c_$(safename)
183-
run_ramalama pull ${model}
184-
run_ramalama -q serve --port 1234 --generate=quadlet ${model}
185-
is "$output" "Generating quadlet file: tinyllama.container" "generate tinllama.container"
185+
run_ramalama pull $model_quant
186+
run_ramalama -q serve --port 1234 --generate=quadlet $model
187+
is "$output" "Generating quadlet file: $quadlet" "generate $quadlet"
186188

187-
run cat tinyllama.container
189+
run cat $quadlet
188190
is "$output" ".*PublishPort=1234:1234" "PublishPort should match"
189191
is "$output" ".*Exec=.*llama-server --port 1234 --model .*" "Exec line should be correct"
190-
is "$output" ".*Mount=type=bind,.*tinyllama" "Mount line should be correct"
192+
is "$output" ".*Mount=type=bind,.*$model" "Mount line should be correct"
191193

192-
HIP_VISIBLE_DEVICES=99 run_ramalama -q serve --port 1234 --generate=quadlet ${model}
193-
is "$output" "Generating quadlet file: tinyllama.container" "generate tinllama.container"
194+
HIP_VISIBLE_DEVICES=99 run_ramalama -q serve --port 1234 --generate=quadlet $model
195+
is "$output" "Generating quadlet file: $quadlet" "generate $quadlet"
194196

195-
run cat tinyllama.container
197+
run cat $quadlet
196198
is "$output" ".*Environment=HIP_VISIBLE_DEVICES=99" "Should contain env property"
197199

198-
rm tinyllama.container
199-
run_ramalama 2 serve --name=${name} --port 1234 --generate=bogus tiny
200+
rm $quadlet
201+
run_ramalama 2 serve --name=${name} --port 1234 --generate=bogus $model
200202
is "$output" ".*error: argument --generate: invalid choice: .*bogus.* (choose from.*quadlet.*kube.*quadlet/kube.*)" "Should fail"
201203
}
202204

@@ -273,33 +275,34 @@ verify_begin=".*run --rm"
273275

274276

275277
@test "ramalama serve --generate=kube" {
276-
model=tiny
278+
model="smollm"
279+
model_quant="$model:135m"
277280
name=c_$(safename)
278-
run_ramalama pull ${model}
279-
run_ramalama serve --name=${name} --port 1234 --generate=kube ${model}
281+
run_ramalama pull $model_quant
282+
run_ramalama serve --name=${name} --port 1234 --generate=kube $model_quant
280283
is "$output" ".*Generating Kubernetes YAML file: ${name}.yaml" "generate .yaml file"
281284

282285
run cat $name.yaml
283286
is "$output" ".*command: \[\".*serve.*\"\]" "Should command"
284287
is "$output" ".*containerPort: 1234" "Should container container port"
285288

286-
HIP_VISIBLE_DEVICES=99 run_ramalama serve --name=${name} --port 1234 --generate=kube ${model}
289+
HIP_VISIBLE_DEVICES=99 run_ramalama serve --name=${name} --port 1234 --generate=kube $model_quant
287290
is "$output" ".*Generating Kubernetes YAML file: ${name}.yaml" "generate .yaml file"
288291

289292
run cat $name.yaml
290293
is "$output" ".*env:" "Should contain env property"
291294
is "$output" ".*name: HIP_VISIBLE_DEVICES" "Should contain env name"
292295
is "$output" ".*value: 99" "Should contain env value"
293296

294-
run_ramalama serve --name=${name} --port 1234 --generate=quadlet/kube ${model}
297+
run_ramalama serve --name=${name} --port 1234 --generate=quadlet/kube $model_quant
295298
is "$output" ".*Generating Kubernetes YAML file: ${name}.yaml" "generate .yaml file"
296299
is "$output" ".*Generating quadlet file: ${name}.kube" "generate .kube file"
297300

298301
run cat $name.yaml
299302
is "$output" ".*command: \[\".*serve.*\"\]" "Should command"
300303
is "$output" ".*containerPort: 1234" "Should container container port"
301304

302-
HIP_VISIBLE_DEVICES=99 run_ramalama serve --name=${name} --port 1234 --generate=quadlet/kube ${model}
305+
HIP_VISIBLE_DEVICES=99 run_ramalama serve --name=${name} --port 1234 --generate=quadlet/kube $model_quant
303306
is "$output" ".*Generating Kubernetes YAML file: ${name}.yaml" "generate .yaml file"
304307

305308
run cat $name.yaml

0 commit comments

Comments
 (0)