Blame view

reranker/config.py 549 Bytes
d90e7428   tangwang   补充重排
1
2
  """Reranker service configuration (simple Python config)."""
  
d1d356f8   tangwang   脚本优化
3
4
  import os
  
d90e7428   tangwang   补充重排
5
6
7
  
  class RerankerConfig(object):
      """Reranker service settings, defined as class-level attributes."""

      # Server
d1d356f8   tangwang   脚本优化
8
9
      # Server host; read from the RERANKER_HOST environment variable,
      # falling back to "0.0.0.0" when it is unset.
      HOST = os.getenv("RERANKER_HOST", "0.0.0.0")
      # Server port; read from RERANKER_PORT (default 6007) and converted
      # with int(), so a non-numeric value raises ValueError when this
      # class body is executed.
      PORT = int(os.getenv("RERANKER_PORT", 6007))
d90e7428   tangwang   补充重排
10
11
  
      # Model
07cf5a93   tangwang   START_EMBEDDING=...
12
      # Identifier of the reranker model.
      # NOTE(review): presumably a Hugging Face Hub repo id — confirm against the loader.
      MODEL_NAME = "Qwen/Qwen3-Reranker-0.6B"
d90e7428   tangwang   补充重排
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
      # NOTE(review): the code that consumes the settings below is not visible
      # in this file; the per-line notes are assumptions to confirm.
      DEVICE = None  # None -> auto (cuda if available)
      USE_FP16 = True  # presumably enables half-precision inference — TODO confirm
      BATCH_SIZE = 64  # presumably inputs scored per forward pass — TODO confirm
      MAX_LENGTH = 512  # presumably a per-input token limit — TODO confirm
      CACHE_DIR = "./model_cache"  # relative path; presumably where model files are cached — TODO confirm
      ENABLE_WARMUP = True  # presumably runs a warm-up pass at startup — TODO confirm
  
      # Request limits
      MAX_DOCS = 1000  # presumably the maximum documents accepted per request — TODO confirm
  
      # Output
      NORMALIZE = True  # presumably normalizes the returned scores — TODO confirm
  
  
  # Module-level RerankerConfig instance, created when this module is imported.
  CONFIG = RerankerConfig()