mirror of
https://github.com/michaelthomson0797/fleet-infra.git
synced 2026-03-21 19:27:21 +00:00
ollama upgrade ctx size
This commit is contained in:
@@ -30,8 +30,13 @@ spec:

```yaml

      # -- List of models to pull at container startup
      models:
        pull:
          - qwen3.5:9b
        create:
          - name: qwen3.5:9b-ctx32768
            template: |
              FROM qwen3.5:9b
              PARAMETER num_ctx 32768
        run:
          - qwen3.5:9b-ctx32768

    ingress:
      enabled: true

```
Reference in New Issue
Block a user