7bfb9946
tangwang
向量化模块
|
1
2
|
#!/bin/bash
#
|
7214c2e7
tangwang
mplemented**
|
3
|
# Start Embedding Service (combined/text/image mode).
|
7bfb9946
tangwang
向量化模块
|
4
|
#
|
07cf5a93
tangwang
START_EMBEDDING=...
|
5
6
7
8
|
# Design:
# - Run in isolated venv `.venv-embedding` (do not pollute main `.venv`)
# - Text backend default: TEI (Qwen3-Embedding-0.6B)
# - Image backend: clip-as-service or local CN-CLIP (from embeddings/config.py)
|
7bfb9946
tangwang
向量化模块
|
9
|
#
|
07cf5a93
tangwang
START_EMBEDDING=...
|
10
11
12
13
14
15
16
17
18
19
20
21
22
|
set -euo pipefail
PROJECT_ROOT="$(cd "$(dirname "$0")/.." && pwd)"
cd "${PROJECT_ROOT}"
EMBEDDING_VENV="${EMBEDDING_VENV:-${PROJECT_ROOT}/.venv-embedding}"
PYTHON_BIN="${EMBEDDING_VENV}/bin/python"
if [[ ! -x "${PYTHON_BIN}" ]]; then
echo "ERROR: embedding venv not found: ${EMBEDDING_VENV}" >&2
echo "Please run: ./scripts/setup_embedding_venv.sh" >&2
exit 1
fi
|
7bfb9946
tangwang
向量化模块
|
23
|
|
7fbca0d7
tangwang
启动脚本优化
|
24
25
26
27
|
# Load .env without activating main venv.
# shellcheck source=scripts/lib/load_env.sh
source "${PROJECT_ROOT}/scripts/lib/load_env.sh"
load_env_file "${PROJECT_ROOT}/.env"
|
07cf5a93
tangwang
START_EMBEDDING=...
|
28
29
30
31
32
|
DEFAULT_EMBEDDING_SERVICE_HOST=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.HOST)")
DEFAULT_EMBEDDING_SERVICE_PORT=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.PORT)")
USE_CLIP_AS_SERVICE=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print('1' if CONFIG.USE_CLIP_AS_SERVICE else '0')")
CLIP_AS_SERVICE_SERVER=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.CLIP_AS_SERVICE_SERVER)")
|
4747e2f4
tangwang
embedding perform...
|
33
|
CLIP_AS_SERVICE_MODEL_NAME=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.CLIP_AS_SERVICE_MODEL_NAME)")
|
07cf5a93
tangwang
START_EMBEDDING=...
|
34
35
|
TEXT_BACKEND=$("${PYTHON_BIN}" -c "from config.services_config import get_embedding_backend_config; print(get_embedding_backend_config()[0])")
TEI_BASE_URL=$("${PYTHON_BIN}" -c "import os; from config.services_config import get_embedding_backend_config; from embeddings.config import CONFIG; _, cfg = get_embedding_backend_config(); print(os.getenv('TEI_BASE_URL') or cfg.get('base_url') or CONFIG.TEI_BASE_URL)")
|
7214c2e7
tangwang
mplemented**
|
36
37
38
39
40
41
42
43
44
|
SERVICE_KIND="${1:-${EMBEDDING_SERVICE_KIND:-all}}"
SERVICE_KIND="$(echo "${SERVICE_KIND}" | tr '[:upper:]' '[:lower:]')"
if [[ "${SERVICE_KIND}" != "all" && "${SERVICE_KIND}" != "text" && "${SERVICE_KIND}" != "image" ]]; then
echo "ERROR: invalid embedding service kind: ${SERVICE_KIND}. expected all|text|image" >&2
exit 1
fi
ENABLE_TEXT_MODEL="${EMBEDDING_ENABLE_TEXT_MODEL:-true}"
ENABLE_TEXT_MODEL="$(echo "${ENABLE_TEXT_MODEL}" | tr '[:upper:]' '[:lower:]')"
|
efd435cf
tangwang
tei性能调优:
|
45
46
|
ENABLE_IMAGE_MODEL="${EMBEDDING_ENABLE_IMAGE_MODEL:-true}"
ENABLE_IMAGE_MODEL="$(echo "${ENABLE_IMAGE_MODEL}" | tr '[:upper:]' '[:lower:]')"
|
7214c2e7
tangwang
mplemented**
|
47
48
49
50
51
52
53
54
55
56
57
58
|
TEXT_MODEL_ENABLED=0
IMAGE_MODEL_ENABLED=0
if [[ "${SERVICE_KIND}" == "all" || "${SERVICE_KIND}" == "text" ]]; then
if [[ "${ENABLE_TEXT_MODEL}" == "1" || "${ENABLE_TEXT_MODEL}" == "true" || "${ENABLE_TEXT_MODEL}" == "yes" ]]; then
TEXT_MODEL_ENABLED=1
fi
fi
if [[ "${SERVICE_KIND}" == "all" || "${SERVICE_KIND}" == "image" ]]; then
if [[ "${ENABLE_IMAGE_MODEL}" == "1" || "${ENABLE_IMAGE_MODEL}" == "true" || "${ENABLE_IMAGE_MODEL}" == "yes" ]]; then
IMAGE_MODEL_ENABLED=1
fi
|
efd435cf
tangwang
tei性能调优:
|
59
|
fi
|
d1d356f8
tangwang
脚本优化
|
60
61
|
EMBEDDING_SERVICE_HOST="${EMBEDDING_HOST:-${DEFAULT_EMBEDDING_SERVICE_HOST}}"
|
7214c2e7
tangwang
mplemented**
|
62
|
if [[ "${SERVICE_KIND}" == "text" ]]; then
|
af03fdef
tangwang
embedding模块代码整理
|
63
|
EMBEDDING_SERVICE_PORT="${EMBEDDING_TEXT_PORT:-6005}"
|
7214c2e7
tangwang
mplemented**
|
64
65
66
67
68
|
elif [[ "${SERVICE_KIND}" == "image" ]]; then
EMBEDDING_SERVICE_PORT="${EMBEDDING_IMAGE_PORT:-6008}"
else
EMBEDDING_SERVICE_PORT="${EMBEDDING_PORT:-${DEFAULT_EMBEDDING_SERVICE_PORT}}"
fi
|
7bfb9946
tangwang
向量化模块
|
69
|
|
7214c2e7
tangwang
mplemented**
|
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
|
export EMBEDDING_SERVICE_KIND="${SERVICE_KIND}"
export EMBEDDING_HOST="${EMBEDDING_SERVICE_HOST}"
export EMBEDDING_PORT="${EMBEDDING_SERVICE_PORT}"
if [[ "${TEXT_MODEL_ENABLED}" == "1" ]]; then
export EMBEDDING_ENABLE_TEXT_MODEL=true
else
export EMBEDDING_ENABLE_TEXT_MODEL=false
fi
if [[ "${IMAGE_MODEL_ENABLED}" == "1" ]]; then
export EMBEDDING_ENABLE_IMAGE_MODEL=true
else
export EMBEDDING_ENABLE_IMAGE_MODEL=false
fi
if [[ "${TEXT_MODEL_ENABLED}" == "1" && "${TEXT_BACKEND}" == "tei" ]]; then
|
07cf5a93
tangwang
START_EMBEDDING=...
|
85
86
87
88
89
90
91
|
if ! curl -sf "${TEI_BASE_URL%/}/health" >/dev/null 2>&1; then
echo "ERROR: TEI backend is selected but TEI is not reachable: ${TEI_BASE_URL}/health" >&2
echo "Please start TEI first: ./scripts/start_tei_service.sh" >&2
exit 1
fi
fi
|
efd435cf
tangwang
tei性能调优:
|
92
|
if [[ "${IMAGE_MODEL_ENABLED}" == "1" && "${USE_CLIP_AS_SERVICE}" == "1" ]]; then
|
07cf5a93
tangwang
START_EMBEDDING=...
|
93
94
95
96
97
98
99
100
101
102
103
104
105
|
CLIP_SERVER="${CLIP_AS_SERVICE_SERVER#*://}"
CLIP_HOST="${CLIP_SERVER%:*}"
CLIP_PORT="${CLIP_SERVER##*:}"
if [[ -z "${CLIP_HOST}" || -z "${CLIP_PORT}" ]]; then
echo "ERROR: invalid CLIP_AS_SERVICE_SERVER: ${CLIP_AS_SERVICE_SERVER}" >&2
exit 1
fi
if ! timeout 2 bash -c "cat < /dev/null > /dev/tcp/${CLIP_HOST}/${CLIP_PORT}" >/dev/null 2>&1; then
echo "ERROR: clip-as-service is not reachable at ${CLIP_AS_SERVICE_SERVER}." >&2
echo "Please start CN-CLIP service first: ./scripts/service_ctl.sh start cnclip" >&2
exit 1
fi
if ! "${PYTHON_BIN}" - <<'PY'
|
ed948666
tangwang
tidy
|
106
107
108
109
110
111
|
try:
import pkg_resources # noqa: F401
except Exception:
raise SystemExit(1)
PY
then
|
07cf5a93
tangwang
START_EMBEDDING=...
|
112
113
|
echo "ERROR: clip-as-service image embedding requires pkg_resources in .venv-embedding." >&2
echo "Please run: ./scripts/setup_embedding_venv.sh" >&2
|
ed948666
tangwang
tidy
|
114
115
116
117
|
exit 1
fi
fi
|
7bfb9946
tangwang
向量化模块
|
118
|
echo "========================================"
|
07cf5a93
tangwang
START_EMBEDDING=...
|
119
|
echo "Starting Embedding Service"
|
7bfb9946
tangwang
向量化模块
|
120
|
echo "========================================"
|
7214c2e7
tangwang
mplemented**
|
121
|
echo "Kind: ${SERVICE_KIND}"
|
07cf5a93
tangwang
START_EMBEDDING=...
|
122
|
echo "Python: ${PYTHON_BIN}"
|
7bfb9946
tangwang
向量化模块
|
123
124
|
echo "Host: ${EMBEDDING_SERVICE_HOST}"
echo "Port: ${EMBEDDING_SERVICE_PORT}"
|
7214c2e7
tangwang
mplemented**
|
125
126
127
128
129
130
|
echo "Text backend enabled: ${TEXT_MODEL_ENABLED}"
if [[ "${TEXT_MODEL_ENABLED}" == "1" ]]; then
echo "Text backend: ${TEXT_BACKEND}"
echo "Text max inflight: ${TEXT_MAX_INFLIGHT:-32}"
fi
if [[ "${TEXT_MODEL_ENABLED}" == "1" && "${TEXT_BACKEND}" == "tei" ]]; then
|
07cf5a93
tangwang
START_EMBEDDING=...
|
131
132
|
echo "TEI URL: ${TEI_BASE_URL}"
fi
|
efd435cf
tangwang
tei性能调优:
|
133
134
135
|
if [[ "${IMAGE_MODEL_ENABLED}" == "0" ]]; then
echo "Image backend: disabled"
elif [[ "${USE_CLIP_AS_SERVICE}" == "1" ]]; then
|
4747e2f4
tangwang
embedding perform...
|
136
|
echo "Image backend: clip-as-service (${CLIP_AS_SERVICE_SERVER}, model=${CLIP_AS_SERVICE_MODEL_NAME})"
|
07cf5a93
tangwang
START_EMBEDDING=...
|
137
|
fi
|
7214c2e7
tangwang
mplemented**
|
138
139
140
|
if [[ "${IMAGE_MODEL_ENABLED}" == "1" ]]; then
echo "Image max inflight: ${IMAGE_MAX_INFLIGHT:-1}"
fi
|
4747e2f4
tangwang
embedding perform...
|
141
|
echo "Logs: logs/embedding_api.log, logs/embedding_api_error.log, logs/verbose/embedding_verbose.log"
|
7bfb9946
tangwang
向量化模块
|
142
143
144
|
echo
echo "Tips:"
echo " - Use a single worker (GPU models cannot be safely duplicated across workers)."
|
7214c2e7
tangwang
mplemented**
|
145
146
147
148
149
|
if [[ "${SERVICE_KIND}" == "text" ]]; then
echo " - Clients can set EMBEDDING_TEXT_SERVICE_URL=http://localhost:${EMBEDDING_SERVICE_PORT}"
elif [[ "${SERVICE_KIND}" == "image" ]]; then
echo " - Clients can set EMBEDDING_IMAGE_SERVICE_URL=http://localhost:${EMBEDDING_SERVICE_PORT}"
else
|
af03fdef
tangwang
embedding模块代码整理
|
150
|
echo " - All mode serves both /embed/text and /embed/image on port ${EMBEDDING_SERVICE_PORT}"
|
7214c2e7
tangwang
mplemented**
|
151
|
fi
|
7bfb9946
tangwang
向量化模块
|
152
153
|
echo
|
efd435cf
tangwang
tei性能调优:
|
154
155
156
157
158
|
UVICORN_LOG_LEVEL="${EMBEDDING_UVICORN_LOG_LEVEL:-info}"
UVICORN_ACCESS_LOG="${EMBEDDING_UVICORN_ACCESS_LOG:-true}"
UVICORN_ARGS=(
--host "${EMBEDDING_SERVICE_HOST}"
--port "${EMBEDDING_SERVICE_PORT}"
|
7bfb9946
tangwang
向量化模块
|
159
|
--workers 1
|
efd435cf
tangwang
tei性能调优:
|
160
161
162
163
164
165
166
|
--log-level "${UVICORN_LOG_LEVEL}"
)
if [[ "${UVICORN_ACCESS_LOG}" == "0" || "${UVICORN_ACCESS_LOG}" == "false" || "${UVICORN_ACCESS_LOG}" == "no" ]]; then
UVICORN_ARGS+=(--no-access-log)
fi
exec "${PYTHON_BIN}" -m uvicorn embeddings.server:app "${UVICORN_ARGS[@]}"
|