# TurboQuant Fleet Inventory
# Copy to inventory.ini and update with actual hosts.
#
# Format: Ansible INI inventory.
# Per-host overrides are written as key=value pairs on the host line itself.
# A [name:vars] section is only accepted when "name" is a group, so settings
# for a single host cannot live in their own [host:vars] section.
# NOTE: values on a host line are parsed as Python literals (32768 is an
# integer); values in a :vars section are always strings.

[turboquant_fleet]
# Mac (Timmy) - M1, 16GB
timmy ansible_host=192.168.1.100 ansible_user=apayne gemma4_model_filename=gemma-4-26B-A4B-q4_k_m.gguf max_context_tokens=131072

# Allegro VPS - 2 cores, 8GB
# Smaller model, shorter context and turbo2 KV type override the fleet defaults.
allegro ansible_host=167.99.126.228 ansible_user=root gemma4_model_filename=gemma-4-E4B-q4_0.gguf max_context_tokens=32768 turboquant_kv_type=turbo2

# Ezra VPS - TBD
# ezra ansible_host=TBD ansible_user=root

# Fleet-wide defaults; a value set on a host line above takes precedence.
[turboquant_fleet:vars]
ansible_python_interpreter=/usr/bin/python3
model_base_path=/opt/models
llama_cpp_port=8081
turboquant_kv_type=turbo4
turboquant_layer_mode=7
max_context_tokens=131072