#!/bin/bash # Stop and remove existing container if it exists docker rm -f embedding-service 2>/dev/null || true echo "🚀 Starting Local Embedding Service (Hugging Face TEI)..." echo "â„šī¸ Note: The previous image (clems4ever/all-minilm-l6-v2-go) is a CLI tool, not a server." echo " Switching to ghcr.io/huggingface/text-embeddings-inference:cpu-latest which provides a compatible API." # Run Hugging Face Text Embeddings Inference (compatible with OpenAI client) docker run -d \ --name embedding-service \ --restart unless-stopped \ -p 11434:80 \ -e MAX_CONCURRENT_REQUESTS=4 \ ghcr.io/huggingface/text-embeddings-inference:cpu-latest \ --model-id sentence-transformers/all-MiniLM-L6-v2 echo "✅ Service started!" echo " URL: http://localhost:11434/v1"