7bfb9946
tangwang
向量化模块
|
1
2
3
4
5
6
7
8
9
10
|
"""
Embedding module configuration.
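This module is intentionally a plain Python file with no dependencies beyond the standard library.
Most settings read an environment variable and fall back to the default defined here.
Set the environment variable, or edit the default in this file, to configure: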
- server host/port
- local model settings (paths/devices/batch sizes)
"""
from typing import Optional
|
d1d356f8
tangwang
脚本优化
|
11
|
import os
|
7bfb9946
tangwang
向量化模块
|
12
13
14
15
|
# Strings (compared case-insensitively, after trimming) that switch a flag on.
_TRUTHY_VALUES = ("1", "true", "yes")


def _env_int(name, default):
    """Return environment variable *name* parsed as an integer.

    An unset or blank variable yields *default*, so an empty export such as
    ``TEXT_BATCH_SIZE=`` does not crash the import.

    Raises:
        ValueError: if the variable holds a non-blank, non-integer value.
            The message names the offending variable.
    """
    raw = os.getenv(name)
    if raw is None or not raw.strip():
        return default
    try:
        return int(raw)
    except ValueError:
        raise ValueError(
            "Environment variable %s must be an integer, got %r" % (name, raw)
        )


def _env_flag(name, default):
    """Return environment variable *name* parsed as a boolean flag.

    An unset or blank variable yields *default*. Any other value is trimmed,
    lower-cased, and is True only when it is one of "1", "true" or "yes".
    """
    raw = os.getenv(name)
    if raw is None or not raw.strip():
        return default
    return raw.strip().lower() in _TRUTHY_VALUES


class EmbeddingConfig(object):
    """Settings for the embedding server and its text/image backends.

    Every attribute is a class attribute evaluated once, when this module is
    imported: the named environment variable is used when it is set, otherwise
    the default written here applies.
    """

    # Server
    HOST = os.getenv("EMBEDDING_HOST", "0.0.0.0")
    PORT = _env_int("EMBEDDING_PORT", 6005)

    # Text backend defaults
    TEXT_MODEL_ID = os.getenv("TEXT_MODEL_ID", "Qwen/Qwen3-Embedding-0.6B")
    # Keep TEXT_MODEL_DIR as an alias so code can refer to one canonical text model value.
    TEXT_MODEL_DIR = TEXT_MODEL_ID
    TEXT_DEVICE = os.getenv("TEXT_DEVICE", "cuda")  # "cuda" or "cpu"
    TEXT_BATCH_SIZE = _env_int("TEXT_BATCH_SIZE", 32)
    TEXT_NORMALIZE_EMBEDDINGS = _env_flag("TEXT_NORMALIZE_EMBEDDINGS", True)
    # TEI service base URL and request timeout in seconds.
    TEI_BASE_URL = os.getenv("TEI_BASE_URL", "http://127.0.0.1:8080")
    TEI_TIMEOUT_SEC = _env_int("TEI_TIMEOUT_SEC", 60)

    # Image embeddings
    # Option A: clip-as-service (Jina CLIP server, recommended)
    USE_CLIP_AS_SERVICE = _env_flag("USE_CLIP_AS_SERVICE", True)
    CLIP_AS_SERVICE_SERVER = os.getenv("CLIP_AS_SERVICE_SERVER", "grpc://127.0.0.1:51000")
    CLIP_AS_SERVICE_MODEL_NAME = os.getenv("CLIP_AS_SERVICE_MODEL_NAME", "CN-CLIP/ViT-L-14")

    # Option B: local CN-CLIP (when USE_CLIP_AS_SERVICE=false)
    IMAGE_MODEL_NAME = os.getenv("IMAGE_MODEL_NAME", "ViT-L-14")
    # Unset or blank IMAGE_DEVICE keeps the None (auto) default.
    IMAGE_DEVICE = os.getenv("IMAGE_DEVICE") or None  # type: Optional[str]  # "cuda" / "cpu" / None(auto)
    # Service behavior
    IMAGE_BATCH_SIZE = _env_int("IMAGE_BATCH_SIZE", 8)
    IMAGE_NORMALIZE_EMBEDDINGS = _env_flag("IMAGE_NORMALIZE_EMBEDDINGS", True)
|
7bfb9946
tangwang
向量化模块
|
42
43
44
|
# Module-level EmbeddingConfig instance, created once when this module is imported.
CONFIG = EmbeddingConfig()
|