86d8358b
tangwang
config optimize
|
1
|
"""Reranker service compatibility config derived from unified app config."""
|
d90e7428
tangwang
补充重排
|
2
|
|
86d8358b
tangwang
config optimize
|
3
4
|
from __future__ import annotations
|
daa2690b
tangwang
漏斗参数调优&呈现优化
|
5
6
|
import os
|
86d8358b
tangwang
config optimize
|
7
|
from config.loader import get_app_config
|
d1d356f8
tangwang
脚本优化
|
8
|
|
d90e7428
tangwang
补充重排
|
9
10
|
class RerankerConfig:
    """Flat, upper-case view of the rerank service settings.

    Every attribute is resolved once, at construction time, from the unified
    app config (``get_app_config().services.rerank``).  The environment
    variables ``RERANK_INSTANCE``, ``RERANKER_HOST``, ``RERANKER_PORT``,
    ``RERANK_BACKEND`` and ``RERANKER_RUNTIME_DIR`` take precedence over the
    configured values whenever they are set to a non-empty string.
    """

    def __init__(self) -> None:
        rerank = get_app_config().services.rerank

        # Pick the instance: env override first, configured default otherwise.
        # A value that is blank after stripping also falls back to the default.
        selected = str(os.getenv("RERANK_INSTANCE") or rerank.default_instance).strip()
        if not selected:
            selected = rerank.default_instance

        inst = rerank.get_instance(selected)
        # Backend settings are looked up by instance name, so a RERANK_BACKEND
        # override below changes self.BACKEND but not which settings are read.
        backend_cfg = rerank.get_backend_config(selected)
        request_cfg = rerank.request

        # --- Instance-level settings (each overridable via environment) ---
        self.INSTANCE = selected
        self.HOST = str(os.getenv("RERANKER_HOST") or inst.host)
        self.PORT = int(os.getenv("RERANKER_PORT") or inst.port)
        self.BACKEND = str(os.getenv("RERANK_BACKEND") or inst.backend)

        runtime_dir = os.getenv("RERANKER_RUNTIME_DIR") or inst.runtime_dir
        if not runtime_dir:
            # Neither env nor config names a directory: use a per-instance path.
            runtime_dir = f"./.runtime/reranker/{selected}"
        self.RUNTIME_DIR = str(runtime_dir)

        # --- Backend (model) settings ---
        self.MODEL_NAME = str(backend_cfg.get("model_name") or "Qwen/Qwen3-Reranker-0.6B")
        self.DEVICE = backend_cfg.get("device")
        self.USE_FP16 = bool(backend_cfg.get("use_fp16", True))
        # "batch_size" wins; "infer_batch_size" is consulted only as a fallback key.
        fallback_batch_size = backend_cfg.get("infer_batch_size", 64)
        self.BATCH_SIZE = int(backend_cfg.get("batch_size", fallback_batch_size))
        self.MAX_LENGTH = int(backend_cfg.get("max_length", 512))
        self.CACHE_DIR = str(backend_cfg.get("cache_dir") or "./model_cache")
        self.ENABLE_WARMUP = bool(backend_cfg.get("enable_warmup", True))

        # --- Request-level settings ---
        self.MAX_DOCS = int(request_cfg.get("max_docs", 1000))
        self.NORMALIZE = bool(request_cfg.get("normalize", True))
|
d90e7428
tangwang
补充重排
|
39
40
41
|
# Shared module-level instance. Constructing it here means the app config and
# any environment overrides are read once, when this module is first imported.
CONFIG = RerankerConfig()
|