---
# Variables for a containerised vLLM deployment.
# NOTE(review): the consumer of these variables is not visible in this file;
# the per-variable notes below describe only what the values themselves show.

# Base directory for the installation on the target host.
vllm_install_dir: /opt/vllm

# Model/data directory, derived from the install directory.
vllm_model_dir: "{{ vllm_install_dir }}/data"

# Container image repository and tag.
# NOTE(review): `latest` is a moving tag; consider pinning a specific release
# so that deployments are reproducible.
vllm_image: vllm/vllm-openai
vllm_image_tag: latest

# Extra container labels (empty list by default).
vllm_container_labels: []

# Extra container environment variables (empty mapping by default).
vllm_container_env: {}

# Model selection. Reference links and alternative model identifiers kept
# from the original file:
#   https://www.jan.ai/docs/desktop/jan-models/jan-code-4b
#   unsloth/Qwen3.5-35B-A3B-GGUF
#   DavidAU/Qwen3.5-40B-Claude-4.6-Opus-Deckard-Heretic-Uncensored-Thinking
#   DavidAU/Qwen3.5-40B-RoughHouse-Claude-4.6-Opus-Polar-Deckard-Uncensored-Heretic-Thinking
vllm_model: "unsloth/Qwen3.5-35B-A3B-GGUF"

# Command-line arguments, one list element per token: a flag that takes a
# value is immediately followed by that value as its own element
# (e.g. `--reasoning-parser` then `qwen3`).
vllm_args:
  - "--enable-prefix-caching"
  - "--enable-auto-tool-choice"
  - "--reasoning-parser"
  - "qwen3"
  - "--tool-call-parser"
  - "qwen3_coder"