Blame view

scripts/start_embedding_service.sh 4.92 KB
7bfb9946   tangwang   向量化模块
1
2
  #!/bin/bash
  #
07cf5a93   tangwang   START_EMBEDDING=...
3
  # Start Embedding Service (port 6005).
7bfb9946   tangwang   向量化模块
4
  #
07cf5a93   tangwang   START_EMBEDDING=...
5
6
7
8
  # Design:
  # - Run in isolated venv `.venv-embedding` (do not pollute main `.venv`)
  # - Text backend default: TEI (Qwen3-Embedding-0.6B)
  # - Image backend: clip-as-service or local CN-CLIP (from embeddings/config.py)
7bfb9946   tangwang   向量化模块
9
  #
07cf5a93   tangwang   START_EMBEDDING=...
10
11
12
13
14
15
16
17
18
19
20
21
22
  set -euo pipefail
  
  PROJECT_ROOT="$(cd "$(dirname "$0")/.." && pwd)"
  cd "${PROJECT_ROOT}"
  
  EMBEDDING_VENV="${EMBEDDING_VENV:-${PROJECT_ROOT}/.venv-embedding}"
  PYTHON_BIN="${EMBEDDING_VENV}/bin/python"
  
  if [[ ! -x "${PYTHON_BIN}" ]]; then
    echo "ERROR: embedding venv not found: ${EMBEDDING_VENV}" >&2
    echo "Please run: ./scripts/setup_embedding_venv.sh" >&2
    exit 1
  fi
7bfb9946   tangwang   向量化模块
23
  
7fbca0d7   tangwang   启动脚本优化
24
25
26
27
  # Load .env without activating main venv.
  # shellcheck source=scripts/lib/load_env.sh
  source "${PROJECT_ROOT}/scripts/lib/load_env.sh"
  load_env_file "${PROJECT_ROOT}/.env"
07cf5a93   tangwang   START_EMBEDDING=...
28
29
30
31
32
  
  DEFAULT_EMBEDDING_SERVICE_HOST=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.HOST)")
  DEFAULT_EMBEDDING_SERVICE_PORT=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.PORT)")
  USE_CLIP_AS_SERVICE=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print('1' if CONFIG.USE_CLIP_AS_SERVICE else '0')")
  CLIP_AS_SERVICE_SERVER=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.CLIP_AS_SERVICE_SERVER)")
4747e2f4   tangwang   embedding perform...
33
  CLIP_AS_SERVICE_MODEL_NAME=$("${PYTHON_BIN}" -c "from embeddings.config import CONFIG; print(CONFIG.CLIP_AS_SERVICE_MODEL_NAME)")
07cf5a93   tangwang   START_EMBEDDING=...
34
35
  TEXT_BACKEND=$("${PYTHON_BIN}" -c "from config.services_config import get_embedding_backend_config; print(get_embedding_backend_config()[0])")
  TEI_BASE_URL=$("${PYTHON_BIN}" -c "import os; from config.services_config import get_embedding_backend_config; from embeddings.config import CONFIG; _, cfg = get_embedding_backend_config(); print(os.getenv('TEI_BASE_URL') or cfg.get('base_url') or CONFIG.TEI_BASE_URL)")
efd435cf   tangwang   tei性能调优:
36
37
38
39
40
41
42
  ENABLE_IMAGE_MODEL="${EMBEDDING_ENABLE_IMAGE_MODEL:-true}"
  ENABLE_IMAGE_MODEL="$(echo "${ENABLE_IMAGE_MODEL}" | tr '[:upper:]' '[:lower:]')"
  if [[ "${ENABLE_IMAGE_MODEL}" == "1" || "${ENABLE_IMAGE_MODEL}" == "true" || "${ENABLE_IMAGE_MODEL}" == "yes" ]]; then
    IMAGE_MODEL_ENABLED=1
  else
    IMAGE_MODEL_ENABLED=0
  fi
d1d356f8   tangwang   脚本优化
43
44
45
  
  EMBEDDING_SERVICE_HOST="${EMBEDDING_HOST:-${DEFAULT_EMBEDDING_SERVICE_HOST}}"
  EMBEDDING_SERVICE_PORT="${EMBEDDING_PORT:-${DEFAULT_EMBEDDING_SERVICE_PORT}}"
7bfb9946   tangwang   向量化模块
46
  
07cf5a93   tangwang   START_EMBEDDING=...
47
48
49
50
51
52
53
54
  if [[ "${TEXT_BACKEND}" == "tei" ]]; then
    if ! curl -sf "${TEI_BASE_URL%/}/health" >/dev/null 2>&1; then
      echo "ERROR: TEI backend is selected but TEI is not reachable: ${TEI_BASE_URL}/health" >&2
      echo "Please start TEI first: ./scripts/start_tei_service.sh" >&2
      exit 1
    fi
  fi
  
efd435cf   tangwang   tei性能调优:
55
  if [[ "${IMAGE_MODEL_ENABLED}" == "1" && "${USE_CLIP_AS_SERVICE}" == "1" ]]; then
07cf5a93   tangwang   START_EMBEDDING=...
56
57
58
59
60
61
62
63
64
65
66
67
68
    CLIP_SERVER="${CLIP_AS_SERVICE_SERVER#*://}"
    CLIP_HOST="${CLIP_SERVER%:*}"
    CLIP_PORT="${CLIP_SERVER##*:}"
    if [[ -z "${CLIP_HOST}" || -z "${CLIP_PORT}" ]]; then
      echo "ERROR: invalid CLIP_AS_SERVICE_SERVER: ${CLIP_AS_SERVICE_SERVER}" >&2
      exit 1
    fi
    if ! timeout 2 bash -c "cat < /dev/null > /dev/tcp/${CLIP_HOST}/${CLIP_PORT}" >/dev/null 2>&1; then
      echo "ERROR: clip-as-service is not reachable at ${CLIP_AS_SERVICE_SERVER}." >&2
      echo "Please start CN-CLIP service first: ./scripts/service_ctl.sh start cnclip" >&2
      exit 1
    fi
    if ! "${PYTHON_BIN}" - <<'PY'
ed948666   tangwang   tidy
69
70
71
72
73
74
  try:
      import pkg_resources  # noqa: F401
  except Exception:
      raise SystemExit(1)
  PY
    then
07cf5a93   tangwang   START_EMBEDDING=...
75
76
      echo "ERROR: clip-as-service image embedding requires pkg_resources in .venv-embedding." >&2
      echo "Please run: ./scripts/setup_embedding_venv.sh" >&2
ed948666   tangwang   tidy
77
78
79
80
      exit 1
    fi
  fi
  
7bfb9946   tangwang   向量化模块
81
  echo "========================================"
07cf5a93   tangwang   START_EMBEDDING=...
82
  echo "Starting Embedding Service"
7bfb9946   tangwang   向量化模块
83
  echo "========================================"
07cf5a93   tangwang   START_EMBEDDING=...
84
  echo "Python: ${PYTHON_BIN}"
7bfb9946   tangwang   向量化模块
85
86
  echo "Host: ${EMBEDDING_SERVICE_HOST}"
  echo "Port: ${EMBEDDING_SERVICE_PORT}"
07cf5a93   tangwang   START_EMBEDDING=...
87
  echo "Text backend: ${TEXT_BACKEND}"
4747e2f4   tangwang   embedding perform...
88
  echo "Text max inflight: ${TEXT_MAX_INFLIGHT:-32}"
07cf5a93   tangwang   START_EMBEDDING=...
89
90
91
  if [[ "${TEXT_BACKEND}" == "tei" ]]; then
    echo "TEI URL: ${TEI_BASE_URL}"
  fi
efd435cf   tangwang   tei性能调优:
92
93
94
  if [[ "${IMAGE_MODEL_ENABLED}" == "0" ]]; then
    echo "Image backend: disabled"
  elif [[ "${USE_CLIP_AS_SERVICE}" == "1" ]]; then
4747e2f4   tangwang   embedding perform...
95
    echo "Image backend: clip-as-service (${CLIP_AS_SERVICE_SERVER}, model=${CLIP_AS_SERVICE_MODEL_NAME})"
07cf5a93   tangwang   START_EMBEDDING=...
96
  fi
4747e2f4   tangwang   embedding perform...
97
98
  echo "Image max inflight: ${IMAGE_MAX_INFLIGHT:-1}"
  echo "Logs: logs/embedding_api.log, logs/embedding_api_error.log, logs/verbose/embedding_verbose.log"
7bfb9946   tangwang   向量化模块
99
100
101
102
103
104
  echo
  echo "Tips:"
  echo "  - Use a single worker (GPU models cannot be safely duplicated across workers)."
  echo "  - Clients can set EMBEDDING_SERVICE_URL=http://localhost:${EMBEDDING_SERVICE_PORT}"
  echo
  
efd435cf   tangwang   tei性能调优:
105
106
107
108
109
  UVICORN_LOG_LEVEL="${EMBEDDING_UVICORN_LOG_LEVEL:-info}"
  UVICORN_ACCESS_LOG="${EMBEDDING_UVICORN_ACCESS_LOG:-true}"
  UVICORN_ARGS=(
    --host "${EMBEDDING_SERVICE_HOST}"
    --port "${EMBEDDING_SERVICE_PORT}"
7bfb9946   tangwang   向量化模块
110
    --workers 1
efd435cf   tangwang   tei性能调优:
111
112
113
114
115
116
117
    --log-level "${UVICORN_LOG_LEVEL}"
  )
  if [[ "${UVICORN_ACCESS_LOG}" == "0" || "${UVICORN_ACCESS_LOG}" == "false" || "${UVICORN_ACCESS_LOG}" == "no" ]]; then
    UVICORN_ARGS+=(--no-access-log)
  fi
  
  exec "${PYTHON_BIN}" -m uvicorn embeddings.server:app "${UVICORN_ARGS[@]}"