start_embedding_service.sh
5.21 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
#!/bin/bash
#
# Start Embedding Service (port 6005).
#
# Design:
# - Run in isolated venv `.venv-embedding` (do not pollute main `.venv`)
# - Text backend default: TEI (Qwen3-Embedding-0.6B)
# - Image backend: clip-as-service or local CN-CLIP (from embeddings/config.py)
#
set -euo pipefail
PROJECT_ROOT="$(cd "$(dirname "$0")/.." && pwd)"
cd "${PROJECT_ROOT}"
EMBEDDING_VENV="${EMBEDDING_VENV:-${PROJECT_ROOT}/.venv-embedding}"
PYTHON_BIN="${EMBEDDING_VENV}/bin/python"
if [[ ! -x "${PYTHON_BIN}" ]]; then
echo "ERROR: embedding venv not found: ${EMBEDDING_VENV}" >&2
echo "Please run: ./scripts/setup_embedding_venv.sh" >&2
exit 1
fi
# Load .env if present (same behavior as activate.sh, without activating main venv)
ENV_FILE="${PROJECT_ROOT}/.env"
if [ -f "${ENV_FILE}" ]; then
while IFS= read -r line || [ -n "${line}" ]; do
line="${line%$'\r'}"
[[ -z "${line//[[:space:]]/}" ]] && continue
[[ "${line}" =~ ^[[:space:]]*# ]] && continue
[[ "${line}" != *=* ]] && continue
key="${line%%=*}"
value="${line#*=}"
key="${key#"${key%%[![:space:]]*}"}"
key="${key%"${key##*[![:space:]]}"}"
value="${value#"${value%%[![:space:]]*}"}"
if [[ ${#value} -ge 2 ]]; then
first="${value:0:1}"
last="${value: -1}"
if [[ ("${first}" == '"' && "${last}" == '"') || ("${first}" == "'" && "${last}" == "'") ]]; then
value="${value:1:${#value}-2}"
fi
fi
export "${key}=${value}"
done < "${ENV_FILE}"
fi
DEFAULT_EMBEDDING_SERVICE_HOST=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.HOST)")
DEFAULT_EMBEDDING_SERVICE_PORT=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.PORT)")
USE_CLIP_AS_SERVICE=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print('1' if CONFIG.USE_CLIP_AS_SERVICE else '0')")
CLIP_AS_SERVICE_SERVER=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.CLIP_AS_SERVICE_SERVER)")
TEXT_BACKEND=$("${PYTHON_BIN}" -c "from config.services_config import get_embedding_backend_config; print(get_embedding_backend_config()[0])")
TEI_BASE_URL=$("${PYTHON_BIN}" -c "import os; from config.services_config import get_embedding_backend_config; from embeddings.config import CONFIG; _, cfg = get_embedding_backend_config(); print(os.getenv('TEI_BASE_URL') or cfg.get('base_url') or CONFIG.TEI_BASE_URL)")
ENABLE_IMAGE_MODEL="${EMBEDDING_ENABLE_IMAGE_MODEL:-true}"
ENABLE_IMAGE_MODEL="$(echo "${ENABLE_IMAGE_MODEL}" | tr '[:upper:]' '[:lower:]')"
if [[ "${ENABLE_IMAGE_MODEL}" == "1" || "${ENABLE_IMAGE_MODEL}" == "true" || "${ENABLE_IMAGE_MODEL}" == "yes" ]]; then
IMAGE_MODEL_ENABLED=1
else
IMAGE_MODEL_ENABLED=0
fi
EMBEDDING_SERVICE_HOST="${EMBEDDING_HOST:-${DEFAULT_EMBEDDING_SERVICE_HOST}}"
EMBEDDING_SERVICE_PORT="${EMBEDDING_PORT:-${DEFAULT_EMBEDDING_SERVICE_PORT}}"
if [[ "${TEXT_BACKEND}" == "tei" ]]; then
if ! curl -sf "${TEI_BASE_URL%/}/health" >/dev/null 2>&1; then
echo "ERROR: TEI backend is selected but TEI is not reachable: ${TEI_BASE_URL}/health" >&2
echo "Please start TEI first: ./scripts/start_tei_service.sh" >&2
exit 1
fi
fi
if [[ "${IMAGE_MODEL_ENABLED}" == "1" && "${USE_CLIP_AS_SERVICE}" == "1" ]]; then
CLIP_SERVER="${CLIP_AS_SERVICE_SERVER#*://}"
CLIP_HOST="${CLIP_SERVER%:*}"
CLIP_PORT="${CLIP_SERVER##*:}"
if [[ -z "${CLIP_HOST}" || -z "${CLIP_PORT}" ]]; then
echo "ERROR: invalid CLIP_AS_SERVICE_SERVER: ${CLIP_AS_SERVICE_SERVER}" >&2
exit 1
fi
if ! timeout 2 bash -c "cat < /dev/null > /dev/tcp/${CLIP_HOST}/${CLIP_PORT}" >/dev/null 2>&1; then
echo "ERROR: clip-as-service is not reachable at ${CLIP_AS_SERVICE_SERVER}." >&2
echo "Please start CN-CLIP service first: ./scripts/service_ctl.sh start cnclip" >&2
exit 1
fi
if ! "${PYTHON_BIN}" - <<'PY'
try:
import pkg_resources # noqa: F401
except Exception:
raise SystemExit(1)
PY
then
echo "ERROR: clip-as-service image embedding requires pkg_resources in .venv-embedding." >&2
echo "Please run: ./scripts/setup_embedding_venv.sh" >&2
exit 1
fi
fi
echo "========================================"
echo "Starting Embedding Service"
echo "========================================"
echo "Python: ${PYTHON_BIN}"
echo "Host: ${EMBEDDING_SERVICE_HOST}"
echo "Port: ${EMBEDDING_SERVICE_PORT}"
echo "Text backend: ${TEXT_BACKEND}"
if [[ "${TEXT_BACKEND}" == "tei" ]]; then
echo "TEI URL: ${TEI_BASE_URL}"
fi
if [[ "${IMAGE_MODEL_ENABLED}" == "0" ]]; then
echo "Image backend: disabled"
elif [[ "${USE_CLIP_AS_SERVICE}" == "1" ]]; then
echo "Image backend: clip-as-service (${CLIP_AS_SERVICE_SERVER})"
fi
echo
echo "Tips:"
echo " - Use a single worker (GPU models cannot be safely duplicated across workers)."
echo " - Clients can set EMBEDDING_SERVICE_URL=http://localhost:${EMBEDDING_SERVICE_PORT}"
echo
UVICORN_LOG_LEVEL="${EMBEDDING_UVICORN_LOG_LEVEL:-info}"
UVICORN_ACCESS_LOG="${EMBEDDING_UVICORN_ACCESS_LOG:-true}"
UVICORN_ARGS=(
--host "${EMBEDDING_SERVICE_HOST}"
--port "${EMBEDDING_SERVICE_PORT}"
--workers 1
--log-level "${UVICORN_LOG_LEVEL}"
)
if [[ "${UVICORN_ACCESS_LOG}" == "0" || "${UVICORN_ACCESS_LOG}" == "false" || "${UVICORN_ACCESS_LOG}" == "no" ]]; then
UVICORN_ARGS+=(--no-access-log)
fi
exec "${PYTHON_BIN}" -m uvicorn embeddings.server:app "${UVICORN_ARGS[@]}"