Blame view

scripts/start_reranker.sh 3.29 KB
d1d356f8   tangwang   脚本优化
1
2
  #!/bin/bash
  #
07cf5a93   tangwang   START_EMBEDDING=...
3
  # Start reranker service from isolated venv (.venv-reranker).
d1d356f8   tangwang   脚本优化
4
  #
07cf5a93   tangwang   START_EMBEDDING=...
5
  set -euo pipefail
d1d356f8   tangwang   脚本优化
6
  
07cf5a93   tangwang   START_EMBEDDING=...
7
8
  PROJECT_ROOT="$(cd "$(dirname "$0")/.." && pwd)"
  cd "${PROJECT_ROOT}"
d1d356f8   tangwang   脚本优化
9
  
07cf5a93   tangwang   START_EMBEDDING=...
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
  RERANKER_VENV="${RERANKER_VENV:-${PROJECT_ROOT}/.venv-reranker}"
  PYTHON_BIN="${RERANKER_VENV}/bin/python"
  
  if [[ ! -x "${PYTHON_BIN}" ]]; then
    echo "ERROR: reranker venv not found: ${RERANKER_VENV}" >&2
    echo "Please run: ./scripts/setup_reranker_venv.sh" >&2
    exit 1
  fi
  
  # Load .env if present (without activating main venv)
  ENV_FILE="${PROJECT_ROOT}/.env"
  if [ -f "${ENV_FILE}" ]; then
    while IFS= read -r line || [ -n "${line}" ]; do
      line="${line%$'\r'}"
      [[ -z "${line//[[:space:]]/}" ]] && continue
      [[ "${line}" =~ ^[[:space:]]*# ]] && continue
      [[ "${line}" != *=* ]] && continue
  
      key="${line%%=*}"
      value="${line#*=}"
      key="${key#"${key%%[![:space:]]*}"}"
      key="${key%"${key##*[![:space:]]}"}"
      value="${value#"${value%%[![:space:]]*}"}"
  
      if [[ ${#value} -ge 2 ]]; then
        first="${value:0:1}"
        last="${value: -1}"
        if [[ ("${first}" == '"' && "${last}" == '"') || ("${first}" == "'" && "${last}" == "'") ]]; then
          value="${value:1:${#value}-2}"
        fi
      fi
  
      export "${key}=${value}"
    done < "${ENV_FILE}"
  fi
d1d356f8   tangwang   脚本优化
45
46
47
  
  RERANKER_HOST="${RERANKER_HOST:-0.0.0.0}"
  RERANKER_PORT="${RERANKER_PORT:-6007}"
07cf5a93   tangwang   START_EMBEDDING=...
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
  RERANK_BACKEND=$("${PYTHON_BIN}" -c "from config.services_config import get_rerank_backend_config; print(get_rerank_backend_config()[0])")
  
  # Keep vLLM/triton/torch caches out of system disk.
  RERANKER_RUNTIME_DIR="${RERANKER_RUNTIME_DIR:-${PROJECT_ROOT}/.runtime/reranker}"
  mkdir -p "${RERANKER_RUNTIME_DIR}/home" \
           "${RERANKER_RUNTIME_DIR}/cache" \
           "${RERANKER_RUNTIME_DIR}/config" \
           "${RERANKER_RUNTIME_DIR}/triton" \
           "${RERANKER_RUNTIME_DIR}/torch_compile" \
           "${RERANKER_RUNTIME_DIR}/tmp"
  export HOME="${RERANKER_RUNTIME_DIR}/home"
  export XDG_CACHE_HOME="${RERANKER_RUNTIME_DIR}/cache"
  export XDG_CONFIG_HOME="${RERANKER_RUNTIME_DIR}/config"
  export TRITON_CACHE_DIR="${RERANKER_RUNTIME_DIR}/triton"
  export TORCHINDUCTOR_CACHE_DIR="${RERANKER_RUNTIME_DIR}/torch_compile"
  export TMPDIR="${RERANKER_RUNTIME_DIR}/tmp"
  export VLLM_NO_USAGE_STATS="${VLLM_NO_USAGE_STATS:-1}"
  export PATH="${RERANKER_VENV}/bin:${PATH}"
  
  if [[ "${RERANK_BACKEND}" == "qwen3_vllm" ]]; then
    if ! command -v nvidia-smi >/dev/null 2>&1 || ! nvidia-smi >/dev/null 2>&1; then
      echo "ERROR: qwen3_vllm backend requires NVIDIA GPU, but nvidia-smi is unavailable." >&2
      exit 1
    fi
    if ! "${PYTHON_BIN}" - <<'PY'
  try:
      import vllm  # noqa: F401
      import torch
      if not torch.cuda.is_available():
          raise SystemExit(1)
  except Exception:
      raise SystemExit(1)
  PY
    then
      echo "ERROR: qwen3_vllm backend requires vllm + CUDA runtime in ${RERANKER_VENV}." >&2
      echo "Please run: ./scripts/setup_reranker_venv.sh and verify CUDA is available." >&2
      exit 1
    fi
  fi
d1d356f8   tangwang   脚本优化
87
88
89
90
  
  echo "========================================"
  echo "Starting Reranker Service"
  echo "========================================"
07cf5a93   tangwang   START_EMBEDDING=...
91
  echo "Python: ${PYTHON_BIN}"
d1d356f8   tangwang   脚本优化
92
93
  echo "Host: ${RERANKER_HOST}"
  echo "Port: ${RERANKER_PORT}"
07cf5a93   tangwang   START_EMBEDDING=...
94
95
  echo "Backend: ${RERANK_BACKEND}"
  echo "Runtime dir: ${RERANKER_RUNTIME_DIR}"
d1d356f8   tangwang   脚本优化
96
97
  echo
  
07cf5a93   tangwang   START_EMBEDDING=...
98
  exec "${PYTHON_BIN}" -m uvicorn reranker.server:app \
d1d356f8   tangwang   脚本优化
99
100
101
    --host "${RERANKER_HOST}" \
    --port "${RERANKER_PORT}" \
    --workers 1