- Complete Fastify gateway with 8-stage pipeline
- Circuit breaker (opossum) per model tier
- Rate limiting per caller
- Ban list validation (EN/DE/auto-detected)
- TIP validator (SFF-8024, part numbers, wavelengths)
- Prometheus metrics
- pg-boss async queue
- PostgreSQL audit log + review queue
- 9 prompt templates (TIP, LinkedIn, ShieldX)
- Learning engine scaffolding
- Auto-learning: ban-list, few-shot, routing, prompt optimizer
9 lines
422 B
Bash
Executable File
9 lines
422 B
Bash
Executable File
#!/bin/bash
#
# Pull the Qwen 2.5 models (3b, 14b, 32b) onto an Ollama server through its
# HTTP API (POST /api/pull).
#
# Environment:
#   OLLAMA_URL  Base URL of the Ollama server
#               (default: http://192.168.178.169:11434)
#
# Requires curl and python3. Exits 0 only when every model was pulled
# successfully, 1 otherwise.

# No `-e`: a failed pull must not abort the loop; failures are collected and
# reported at the end. `pipefail` lets a curl failure fail the whole pipeline.
set -uo pipefail

OLLAMA_URL="${OLLAMA_URL:-http://192.168.178.169:11434}"
readonly MODELS=("qwen2.5:3b" "qwen2.5:14b" "qwen2.5:32b")

# Print a message to stderr and exit with status 1.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

#######################################
# Pull a single model and stream its progress.
# Globals:   OLLAMA_URL (read)
# Arguments: $1 - model name, e.g. "qwen2.5:3b"
# Outputs:   every streamed status object to stdout; server-reported
#            errors to stderr
# Returns:   0 if the server reported {"status":"success"}, non-zero if
#            curl failed, the server reported an error, or the stream ended
#            without a success status
#######################################
pull_model() {
  local model=$1

  # -f turns HTTP errors into a non-zero exit, -sS hides the progress meter
  # but keeps error messages, -N disables output buffering so progress lines
  # appear while the download is running.
  curl -fsS -N -X POST "$OLLAMA_URL/api/pull" \
    -H 'Content-Type: application/json' \
    -d "{\"name\":\"$model\"}" \
    | python3 -c '
import json
import sys

succeeded = False
for raw in sys.stdin:
    raw = raw.strip()
    if not raw:
        continue
    try:
        msg = json.loads(raw)
    except ValueError:
        # Not a JSON line; nothing to report.
        continue
    if not isinstance(msg, dict):
        continue
    if "error" in msg:
        print("error: {}".format(msg["error"]), file=sys.stderr)
        sys.exit(1)
    if "status" in msg:
        print(raw, flush=True)
        if msg["status"] == "success":
            succeeded = True
sys.exit(0 if succeeded else 1)
'
}

for tool in curl python3; do
  command -v "$tool" >/dev/null || die "required tool not found: $tool"
done

echo "Pulling models from $OLLAMA_URL..."

failed=()
for model in "${MODELS[@]}"; do
  echo "Pulling $model..."
  if pull_model "$model"; then
    echo "Done: $model"
  else
    echo "Failed: $model" >&2
    failed+=("$model")
  fi
done

if (( ${#failed[@]} > 0 )); then
  die "Failed to pull: ${failed[*]}"
fi

echo "All models pulled"