fix: remove incorrect start-vllm.sh that would break orchestrator architecture

2025-11-21 18:10:53 +01:00
parent 6944e4ebd5
commit 94080da341
1 changed file with 0 additions and 12 deletions
--- a/start-vllm.sh
+++ b/start-vllm.sh
@@ -1,12 +0,0 @@
 #!/bin/bash
 # Launch vLLM's built-in server, which exposes an OpenAI-compatible API and
 # properly handles streaming, for the Qwen/Qwen2.5-7B-Instruct model.
 #
 # The flags are gathered in an array so each option sits on its own line
 # without backslash continuations; the array is expanded quoted so every
 # element reaches `vllm` as exactly one argument.
 vllm_args=(
   # Address and port the server listens on.
   --host 0.0.0.0
   --port 9000
   # Resource settings passed through to vLLM unchanged.
   --tensor-parallel-size 1
   --gpu-memory-utilization 0.85
   --max-model-len 4096
   # Directory handed to vLLM for downloaded model files.
   --download-dir /workspace/huggingface_cache
   # NOTE(review): this permits code shipped with the model repository to
   # run — confirm the model source is trusted.
   --trust-remote-code
 )

 vllm serve Qwen/Qwen2.5-7B-Instruct "${vllm_args[@]}"