diff --git a/model-orchestrator/models.yaml b/model-orchestrator/models.yaml index c78a529..abc6d63 100644 --- a/model-orchestrator/models.yaml +++ b/model-orchestrator/models.yaml @@ -6,7 +6,7 @@ models: qwen-2.5-7b: type: text framework: vllm - service_script: models/vllm/server.py + service_script: vllm/server.py port: 8000 vram_gb: 14 startup_time_seconds: 120 @@ -16,7 +16,7 @@ models: llama-3.1-8b: type: text framework: vllm - service_script: models/vllm/server.py + service_script: vllm/server.py port: 8001 vram_gb: 17 startup_time_seconds: 120