Initial PoC commit

2026-01-28 20:39:59 -08:00
commit 94811ca7c1
18 changed files with 1831 additions and 0 deletions
--- a/Server/vllm-htr.service
+++ b/Server/vllm-htr.service
@@ -0,0 +1,36 @@
+# ===========================================
+# vLLM HTR Service
+# Runtime settings (the VLLM_* variables) are loaded from /home/fenix/htr-api/.env
+# ===========================================
+# BACKUP COPY of the installed unit - after editing, deploy it with:
+#   sudo cp ~/htr-api/vllm-htr.service /etc/systemd/system/
+#   sudo systemctl daemon-reload && sudo systemctl restart vllm-htr
+# ===========================================
+# NOTE(review): network.target does not guarantee a configured interface; confirm VLLM_HOST can be bound this early.
+[Unit]
+Description=vLLM Server for HTR
+After=network.target
+
+[Service]
+Type=simple
+User=fenix
+WorkingDirectory=/llm
+
+# Restart policy: only after a failure, pausing 10 s between attempts
+Restart=on-failure
+RestartSec=10
+TimeoutStartSec=300
+
+# Expected to define every VLLM_* variable referenced by ExecStart
+EnvironmentFile=/home/fenix/htr-api/.env
+# The ${VAR} form passes each value to vllm as exactly one argument
+ExecStart=/llm/env/bin/vllm serve ${VLLM_MODEL_PATH} \
+    --host ${VLLM_HOST} \
+    --port ${VLLM_PORT} \
+    --max-model-len ${VLLM_MAX_MODEL_LEN} \
+    --gpu-memory-utilization ${VLLM_GPU_UTIL} \
+    --trust-remote-code \
+    --served-model-name ${VLLM_MODEL_NAME}
+# Pulled in by multi-user.target once the unit is enabled (systemctl enable vllm-htr).
+[Install]
+WantedBy=multi-user.target