Files
turboquant/ansible/roles/turboquant-deploy/tasks/integration_test.yml

39 lines
973 B
YAML

---
# Post-deploy integration tests
# Poll GET /v1/models on localhost (port taken from `llama_cpp_port`) until it
# answers with HTTP 200. The result of each attempt is registered as
# `model_check`; the task is retried up to 30 times with a 5 second delay.
- name: Wait for TurboQuant service to be ready
  uri:
    method: GET
    url: 'http://localhost:{{ llama_cpp_port }}/v1/models'
    status_code: 200
  register: model_check
  until: model_check.status == 200
  delay: 5
  retries: 30
# POST a single short chat request to /v1/chat/completions on localhost and
# register the module result as `inference_test`. The task itself only
# requires an HTTP 200 status.
# NOTE(review): the task name mentions a tool call, but the request body below
# carries no tool definitions - confirm which of the two is intended.
- name: Test inference with tool call
  uri:
    method: POST
    url: 'http://localhost:{{ llama_cpp_port }}/v1/chat/completions'
    status_code: 200
    body_format: json
    body:
      model: gemma-4
      max_tokens: 20
      messages:
        - role: user
          content: "Say 'test passed' and nothing else."
  register: inference_test
# Check that the registered `inference_test` result contains a parsed JSON
# body with a non-empty `choices` list.
- name: Verify inference response
  assert:
    that:
      # Guard first: if the response was not parsed as JSON, the `json` key is
      # absent and the checks below would abort with an undefined-variable
      # error instead of reporting fail_msg.
      - "inference_test.json is defined"
      - "'choices' in inference_test.json"
      - "inference_test.json.choices | length > 0"
    fail_msg: "Inference test failed - no valid response"
    success_msg: "Inference test passed"
# Print a confirmation message that names the current inventory host.
- name: Report test results
  debug:
    msg: 'Integration test passed on {{ inventory_hostname }}'