start_embedding_service.sh
4.45 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
#!/bin/bash
#
# Start Embedding Service (port 6005).
#
# Design:
# - Run in isolated venv `.venv-embedding` (do not pollute main `.venv`)
# - Text backend default: TEI (Qwen3-Embedding-0.6B)
# - Image backend: clip-as-service or local CN-CLIP (from embeddings/config.py)
#
set -euo pipefail
PROJECT_ROOT="$(cd "$(dirname "$0")/.." && pwd)"
cd "${PROJECT_ROOT}"
EMBEDDING_VENV="${EMBEDDING_VENV:-${PROJECT_ROOT}/.venv-embedding}"
PYTHON_BIN="${EMBEDDING_VENV}/bin/python"
if [[ ! -x "${PYTHON_BIN}" ]]; then
echo "ERROR: embedding venv not found: ${EMBEDDING_VENV}" >&2
echo "Please run: ./scripts/setup_embedding_venv.sh" >&2
exit 1
fi
# Load .env if present (same behavior as activate.sh, without activating main venv)
ENV_FILE="${PROJECT_ROOT}/.env"
if [ -f "${ENV_FILE}" ]; then
while IFS= read -r line || [ -n "${line}" ]; do
line="${line%$'\r'}"
[[ -z "${line//[[:space:]]/}" ]] && continue
[[ "${line}" =~ ^[[:space:]]*# ]] && continue
[[ "${line}" != *=* ]] && continue
key="${line%%=*}"
value="${line#*=}"
key="${key#"${key%%[![:space:]]*}"}"
key="${key%"${key##*[![:space:]]}"}"
value="${value#"${value%%[![:space:]]*}"}"
if [[ ${#value} -ge 2 ]]; then
first="${value:0:1}"
last="${value: -1}"
if [[ ("${first}" == '"' && "${last}" == '"') || ("${first}" == "'" && "${last}" == "'") ]]; then
value="${value:1:${#value}-2}"
fi
fi
export "${key}=${value}"
done < "${ENV_FILE}"
fi
DEFAULT_EMBEDDING_SERVICE_HOST=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.HOST)")
DEFAULT_EMBEDDING_SERVICE_PORT=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.PORT)")
USE_CLIP_AS_SERVICE=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print('1' if CONFIG.USE_CLIP_AS_SERVICE else '0')")
CLIP_AS_SERVICE_SERVER=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.CLIP_AS_SERVICE_SERVER)")
TEXT_BACKEND=$("${PYTHON_BIN}" -c "from config.services_config import get_embedding_backend_config; print(get_embedding_backend_config()[0])")
TEI_BASE_URL=$("${PYTHON_BIN}" -c "import os; from config.services_config import get_embedding_backend_config; from embeddings.config import CONFIG; _, cfg = get_embedding_backend_config(); print(os.getenv('TEI_BASE_URL') or cfg.get('base_url') or CONFIG.TEI_BASE_URL)")
EMBEDDING_SERVICE_HOST="${EMBEDDING_HOST:-${DEFAULT_EMBEDDING_SERVICE_HOST}}"
EMBEDDING_SERVICE_PORT="${EMBEDDING_PORT:-${DEFAULT_EMBEDDING_SERVICE_PORT}}"
if [[ "${TEXT_BACKEND}" == "tei" ]]; then
if ! curl -sf "${TEI_BASE_URL%/}/health" >/dev/null 2>&1; then
echo "ERROR: TEI backend is selected but TEI is not reachable: ${TEI_BASE_URL}/health" >&2
echo "Please start TEI first: ./scripts/start_tei_service.sh" >&2
exit 1
fi
fi
if [[ "${USE_CLIP_AS_SERVICE}" == "1" ]]; then
CLIP_SERVER="${CLIP_AS_SERVICE_SERVER#*://}"
CLIP_HOST="${CLIP_SERVER%:*}"
CLIP_PORT="${CLIP_SERVER##*:}"
if [[ -z "${CLIP_HOST}" || -z "${CLIP_PORT}" ]]; then
echo "ERROR: invalid CLIP_AS_SERVICE_SERVER: ${CLIP_AS_SERVICE_SERVER}" >&2
exit 1
fi
if ! timeout 2 bash -c "cat < /dev/null > /dev/tcp/${CLIP_HOST}/${CLIP_PORT}" >/dev/null 2>&1; then
echo "ERROR: clip-as-service is not reachable at ${CLIP_AS_SERVICE_SERVER}." >&2
echo "Please start CN-CLIP service first: ./scripts/service_ctl.sh start cnclip" >&2
exit 1
fi
if ! "${PYTHON_BIN}" - <<'PY'
try:
import pkg_resources # noqa: F401
except Exception:
raise SystemExit(1)
PY
then
echo "ERROR: clip-as-service image embedding requires pkg_resources in .venv-embedding." >&2
echo "Please run: ./scripts/setup_embedding_venv.sh" >&2
exit 1
fi
fi
echo "========================================"
echo "Starting Embedding Service"
echo "========================================"
echo "Python: ${PYTHON_BIN}"
echo "Host: ${EMBEDDING_SERVICE_HOST}"
echo "Port: ${EMBEDDING_SERVICE_PORT}"
echo "Text backend: ${TEXT_BACKEND}"
if [[ "${TEXT_BACKEND}" == "tei" ]]; then
echo "TEI URL: ${TEI_BASE_URL}"
fi
if [[ "${USE_CLIP_AS_SERVICE}" == "1" ]]; then
echo "Image backend: clip-as-service (${CLIP_AS_SERVICE_SERVER})"
fi
echo
echo "Tips:"
echo " - Use a single worker (GPU models cannot be safely duplicated across workers)."
echo " - Clients can set EMBEDDING_SERVICE_URL=http://localhost:${EMBEDDING_SERVICE_PORT}"
echo
exec "${PYTHON_BIN}" -m uvicorn embeddings.server:app \
--host "${EMBEDDING_SERVICE_HOST}" \
--port "${EMBEDDING_SERVICE_PORT}" \
--workers 1