feat(rag): add OpenVINO NPU embedding services

This commit is contained in:
William Valentin
2026-06-04 13:07:51 -07:00
parent 83d0ced08c
commit 0a6f84fbf3
6 changed files with 651 additions and 0 deletions
+16
View File
@@ -0,0 +1,16 @@
# systemd unit: runs rag-embedding-health-server.py as a long-lived service.
# All script configuration is supplied through the Environment= lines in [Service].

[Unit]
Description=RAG/Embedding Health HTTP Service (port 18814)
# Ordering only (not a requirement): start after network.target is reached.
# NOTE(review): WantedBy=default.target below suggests this may be installed as a
# user unit; confirm this ordering is effective under the manager it runs in.
After=network.target

[Service]
# The unit counts as started once the main process has been spawned.
Type=simple

# Settings handed to the script via its environment.
# NOTE(review): PORT is presumably the listening port (it matches the
# Description) - confirm against the script.
Environment=PORT=18814
# NOTE(review): units are not visible here; presumably seconds - confirm.
Environment=RAG_HEALTH_TIMEOUT=180
# NOTE(review): presumably the embedding backend the health check queries - confirm.
Environment=OLLAMA_BASE_URL=http://127.0.0.1:18817
Environment=RAG_EMBED_MODEL=bge-base-en-v1.5-int8-ov

# NOTE(review): absolute path into one user's home directory; the unit is not
# portable to another account or checkout location without editing this line.
ExecStart=/usr/bin/python3 /home/will/lab/swarm/scripts/rag-embedding-health-server.py

# Restart only after an unclean exit, waiting 5 seconds between attempts.
Restart=on-failure
RestartSec=5

[Install]
# When enabled, the unit is pulled in by default.target.
WantedBy=default.target