Blame view

config/config.yaml 13.8 KB
86d0e83d   tangwang   query翻译,根据源语言是否在索...
1
  runtime:
432d1c88   tangwang   评估框架
2
3
4
    environment: prod
    index_namespace: ''
    api_host: 0.0.0.0
86d0e83d   tangwang   query翻译,根据源语言是否在索...
5
    api_port: 6002
432d1c88   tangwang   评估框架
6
    indexer_host: 0.0.0.0
86d0e83d   tangwang   query翻译,根据源语言是否在索...
7
    indexer_port: 6004
432d1c88   tangwang   评估框架
8
    embedding_host: 0.0.0.0
86d0e83d   tangwang   query翻译,根据源语言是否在索...
9
10
11
    # embedding_port and embedding_text_port carry the same value (6005);
    # image embedding is given a separate port (6008).
    embedding_port: 6005
    embedding_text_port: 6005
    embedding_image_port: 6008
432d1c88   tangwang   评估框架
12
    translator_host: 0.0.0.0
86d0e83d   tangwang   query翻译,根据源语言是否在索...
13
    translator_port: 6006
432d1c88   tangwang   评估框架
14
    reranker_host: 0.0.0.0
86d0e83d   tangwang   query翻译,根据源语言是否在索...
15
    reranker_port: 6007
86d0e83d   tangwang   query翻译,根据源语言是否在索...
16
17
  infrastructure:
    elasticsearch:
432d1c88   tangwang   评估框架
18
      host: http://localhost:9200
86d0e83d   tangwang   query翻译,根据源语言是否在索...
19
20
21
      username: null
      password: null
    redis:
432d1c88   tangwang   评估框架
22
      host: localhost
86d0e83d   tangwang   query翻译,根据源语言是否在索...
23
24
25
26
27
28
29
      # NOTE(review): 6479 is not Redis's stock port (6379) — confirm this is intentional.
      port: 6479
      snapshot_db: 0
      password: null
      # Timeouts are presumably expressed in seconds — TODO confirm against the client setup.
      socket_timeout: 1
      socket_connect_timeout: 1
      retry_on_timeout: false
      # 720 days; the translation cache's ttl_seconds (62208000) is the same duration.
      cache_expire_days: 720
432d1c88   tangwang   评估框架
30
31
      embedding_cache_prefix: embedding
      anchor_cache_prefix: product_anchors
86d0e83d   tangwang   query翻译,根据源语言是否在索...
32
33
34
35
36
37
38
39
40
41
      anchor_cache_expire_days: 30
    # Relational database connection. Only the port is set in this file; host,
    # database name and credentials are null (presumably injected at deploy
    # time — confirm where they are resolved).
    database:
      host: null
      port: 3306
      database: null
      username: null
      password: null
    # API keys are null here, so no secret values are committed in this file.
    secrets:
      dashscope_api_key: null
      deepl_auth_key: null
432d1c88   tangwang   评估框架
42
  es_index_name: search_products
86d0e83d   tangwang   query翻译,根据源语言是否在索...
43
  indexes: []
86d8358b   tangwang   config optimize
44
  assets:
432d1c88   tangwang   评估框架
45
    query_rewrite_dictionary_path: config/dictionaries/query_rewrite.dict
41f0b2e9   tangwang   product_enrich支持并发
46
47
  product_enrich:
    max_workers: 40
4d824a77   tangwang   所有租户共用一套统一配置.tena...
48
49
50
  es_settings:
    number_of_shards: 1
    number_of_replicas: 0
432d1c88   tangwang   评估框架
51
    refresh_interval: 30s
33839b37   tangwang   属性值参与搜索:
52
  field_boosts:
bd96cead   tangwang   1. 动态多语言字段与统一策略配置
53
    title: 3.0
69881ecb   tangwang   相关性调参、enrich内容解析优化
54
55
56
57
    qanchors: 2.5
    tags: 2.0
    category_name_text: 2.0
    category_path: 2.0
bd96cead   tangwang   1. 动态多语言字段与统一策略配置
58
    brief: 1.5
69881ecb   tangwang   相关性调参、enrich内容解析优化
59
    description: 1.5
e756b18e   tangwang   重构了文本召回构建器,现在每个 b...
60
    vendor: 1.5
69881ecb   tangwang   相关性调参、enrich内容解析优化
61
62
63
    option1_values: 1.5
    option2_values: 1.5
    option3_values: 1.5
4d824a77   tangwang   所有租户共用一套统一配置.tena...
64
  query_config:
4d824a77   tangwang   所有租户共用一套统一配置.tena...
65
    supported_languages:
432d1c88   tangwang   评估框架
66
67
68
    - zh
    - en
    default_language: en
4d824a77   tangwang   所有租户共用一套统一配置.tena...
69
70
    enable_text_embedding: true
    enable_query_rewrite: true
432d1c88   tangwang   评估框架
71
72
73
74
75
76
77
78
    # Translation model per direction. Every entry, including the
    # *__source_not_in_index variants, currently names the same model.
    zh_to_en_model: nllb-200-distilled-600m
    en_to_zh_model: nllb-200-distilled-600m
    default_translation_model: nllb-200-distilled-600m
    zh_to_en_model__source_not_in_index: nllb-200-distilled-600m
    en_to_zh_model__source_not_in_index: nllb-200-distilled-600m
    default_translation_model__source_not_in_index: nllb-200-distilled-600m
    # Wait budgets in milliseconds (per the key names): 200 when the source
    # language is in the index, 300 when it is not.
    translation_embedding_wait_budget_ms_source_in_index: 200
    translation_embedding_wait_budget_ms_source_not_in_index: 300
cda1cd62   tangwang   意图分析&应用 baseline
79
80
    style_intent:
      enabled: true
87cacb1b   tangwang   融合公式优化。加入意图匹配因子
81
      selected_sku_boost: 1.2
432d1c88   tangwang   评估框架
82
83
      color_dictionary_path: config/dictionaries/style_intent_color.csv
      size_dictionary_path: config/dictionaries/style_intent_size.csv
cda1cd62   tangwang   意图分析&应用 baseline
84
      dimension_aliases:
432d1c88   tangwang   评估框架
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
        # Alias spellings listed for the "color" dimension.
        color:
        - color
        - colors
        - colour
        - colours
        - 颜色
        # NOTE(review): the next item is empty in this view and would load as a
        # null entry rather than a string. The alias text appears to have been
        # lost — restore the intended value or remove the entry.
        - 
        - 色系
        # Alias spellings listed for the "size" dimension.
        size:
        - size
        - sizes
        - sizing
        - 尺码
        - 尺寸
        - 码数
        - 号码
        # NOTE(review): empty item, same concern as in the color list above —
        # it loads as null; restore the intended alias or remove it.
        - 
74fdf9bd   tangwang   1.
102
103
    product_title_exclusion:
      enabled: true
432d1c88   tangwang   评估框架
104
      dictionary_path: config/dictionaries/product_title_exclusion.tsv
bd96cead   tangwang   1. 动态多语言字段与统一策略配置
105
106
    search_fields:
      multilingual_fields:
432d1c88   tangwang   评估框架
107
108
109
110
111
112
113
114
      - title
      - qanchors
      - category_path
      - category_name_text
      - brief
      - description
      - vendor
      shared_fields: null
bd96cead   tangwang   1. 动态多语言字段与统一策略配置
115
      core_multilingual_fields:
432d1c88   tangwang   评估框架
116
117
118
      - title
      - qanchors
      - category_name_text
bd96cead   tangwang   1. 动态多语言字段与统一策略配置
119
    text_query_strategy:
432d1c88   tangwang   评估框架
120
121
      base_minimum_should_match: 60%
      translation_minimum_should_match: 60%
69881ecb   tangwang   相关性调参、enrich内容解析优化
122
123
      translation_boost: 0.75
      tie_breaker_base_query: 0.5
e756b18e   tangwang   重构了文本召回构建器,现在每个 b...
124
125
126
127
128
129
130
131
132
      # Overall boost plus per-field weights for the best_fields group.
      best_fields_boost: 2.0
      best_fields:
        title: 4.0
        qanchors: 3.0
        category_name_text: 2.0
      # Per-field weights for the phrase group; only title and qanchors are
      # listed. phrase_match_boost is the group-level boost.
      phrase_fields:
        title: 5.0
        qanchors: 4.0
      phrase_match_boost: 3.0
432d1c88   tangwang   评估框架
133
134
    text_embedding_field: title_embedding
    image_embedding_field: image_embedding.vector
a7cc9078   tangwang   sku排序
135
    source_fields:
432d1c88   tangwang   评估框架
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
    # Identity and descriptive text
    - spu_id
    - handle
    - title
    - brief
    - description
    - vendor
    # Category
    - category_name
    - category_name_text
    - category_path
    - category_id
    - category_level
    - category1_name
    - category2_name
    - category3_name
    - tags
    # Pricing, image and inventory
    - min_price
    - compare_at_price
    - image_url
    - sku_prices
    - sku_weights
    - sku_weight_units
    - total_inventory
    # Options, specifications and SKUs
    - option1_name
    - option1_values
    - option2_name
    - option2_values
    - option3_name
    - option3_values
    - specifications
    - skus
ceaf6d03   tangwang   召回限定:must条件补充主干词命...
166
167
    knn_text_boost: 4
    knn_image_boost: 4
de98daa3   tangwang   多模态召回优化
168
169
    knn_text_k: 160
    knn_text_num_candidates: 560
de98daa3   tangwang   多模态召回优化
170
171
    knn_text_k_long: 400
    knn_text_num_candidates_long: 1200
de98daa3   tangwang   多模态召回优化
172
173
    knn_image_k: 400
    knn_image_num_candidates: 1200
4d824a77   tangwang   所有租户共用一套统一配置.tena...
174
  function_score:
432d1c88   tangwang   评估框架
175
176
    score_mode: sum
    boost_mode: multiply
4d824a77   tangwang   所有租户共用一套统一配置.tena...
177
    functions: []
8c8b9d84   tangwang   ES 拉取 coarse_rank...
178
179
180
181
182
183
184
  # Coarse ranking stage: input_window 700, output_window 240
  # (presumably document counts — confirm against the ranking code).
  coarse_rank:
    enabled: true
    input_window: 700
    output_window: 240
    # Fusion parameters; how bias/exponent enter the score formula is not
    # shown in this file — see the consuming code.
    fusion:
      text_bias: 0.1
      text_exponent: 0.35
de98daa3   tangwang   多模态召回优化
185
      text_translation_weight: 1.0
8c8b9d84   tangwang   ES 拉取 coarse_rank...
186
187
188
189
190
      knn_text_weight: 1.0
      knn_image_weight: 1.0
      knn_tie_breaker: 0.1
      knn_bias: 0.6
      knn_exponent: 0.0
8c8b9d84   tangwang   ES 拉取 coarse_rank...
191
  fine_rank:
418b6a4a   tangwang   调参
192
193
    enabled: false
    input_window: 160
8c8b9d84   tangwang   ES 拉取 coarse_rank...
194
195
    output_window: 80
    timeout_sec: 10.0
432d1c88   tangwang   评估框架
196
197
198
    rerank_query_template: '{query}'
    rerank_doc_template: '{title}'
    service_profile: fine
4d824a77   tangwang   所有租户共用一套统一配置.tena...
199
  rerank:
5f7d7f09   tangwang   性能测试报告.md
200
    enabled: true
418b6a4a   tangwang   调参
201
    rerank_window: 160
42e3aea6   tangwang   tidy
202
    timeout_sec: 15.0
506c39b7   tangwang   feat(search): 统一重...
203
204
    weight_es: 0.4
    weight_ai: 0.6
432d1c88   tangwang   评估框架
205
206
207
    rerank_query_template: '{query}'
    rerank_doc_template: '{title}'
    service_profile: default
814e352b   tangwang   乘法公式配置化
208
    fusion:
432d1c88   tangwang   评估框架
209
210
211
      rerank_bias: 1.0e-05
      rerank_exponent: 1.15
      fine_bias: 1.0e-05
8c8b9d84   tangwang   ES 拉取 coarse_rank...
212
      fine_exponent: 1.0
814e352b   tangwang   乘法公式配置化
213
      text_bias: 0.1
432d1c88   tangwang   评估框架
214
215
      text_exponent: 0.25
      text_translation_weight: 0.8
24edc208   tangwang   修改_extract_combin...
216
217
218
      knn_text_weight: 1.0
      knn_image_weight: 1.0
      knn_tie_breaker: 0.1
814e352b   tangwang   乘法公式配置化
219
      knn_bias: 0.6
ceaf6d03   tangwang   召回限定:must条件补充主干词命...
220
      knn_exponent: 0.0
42e3aea6   tangwang   tidy
221
222
  services:
    translation:
432d1c88   tangwang   评估框架
223
224
225
      service_url: http://127.0.0.1:6006
      default_model: nllb-200-distilled-600m
      default_scene: general
42e3aea6   tangwang   tidy
226
      timeout_sec: 10.0
d4cadc13   tangwang   翻译重构
227
      cache:
d4cadc13   tangwang   翻译重构
228
229
        # 62208000 s = 720 days (720 * 86400).
        ttl_seconds: 62208000
        sliding_expiration: true
8140e942   tangwang   translator model ...
230
        enable_model_quality_tier_cache: true
8140e942   tangwang   translator model ...
231
232
233
234
235
236
237
        # Tier value per translation model: deepl, qwen-mt and llm share 30,
        # nllb is 20, both opus-mt models are 10.
        # NOTE(review): presumably a higher tier means higher quality — confirm
        # against the cache lookup logic.
        model_quality_tiers:
          deepl: 30
          qwen-mt: 30
          llm: 30
          nllb-200-distilled-600m: 20
          opus-mt-zh-en: 10
          opus-mt-en-zh: 10
5e4dc8e4   tangwang   翻译架构按“一个翻译服务 +
238
      capabilities:
d4cadc13   tangwang   翻译重构
239
        qwen-mt:
5e4dc8e4   tangwang   翻译架构按“一个翻译服务 +
240
          enabled: true
432d1c88   tangwang   评估框架
241
242
243
          backend: qwen_mt
          model: qwen-mt-flash
          base_url: https://dashscope-us.aliyuncs.com/compatible-mode/v1
42e3aea6   tangwang   tidy
244
          timeout_sec: 10.0
5e4dc8e4   tangwang   翻译架构按“一个翻译服务 +
245
          use_cache: true
a0a173ae   tangwang   last
246
        llm:
5e4dc8e4   tangwang   翻译架构按“一个翻译服务 +
247
          enabled: true
432d1c88   tangwang   评估框架
248
249
250
          backend: llm
          model: qwen-flash
          base_url: https://dashscope-us.aliyuncs.com/compatible-mode/v1
a0a173ae   tangwang   last
251
          timeout_sec: 30.0
cd4ce66d   tangwang   trans logs
252
          use_cache: true
d4cadc13   tangwang   翻译重构
253
        deepl:
cd4ce66d   tangwang   trans logs
254
          enabled: true
432d1c88   tangwang   评估框架
255
256
          backend: deepl
          api_url: https://api.deepl.com/v2/translate
d4cadc13   tangwang   翻译重构
257
          timeout_sec: 10.0
432d1c88   tangwang   评估框架
258
          glossary_id: ''
cd4ce66d   tangwang   trans logs
259
          use_cache: true
0fd2f875   tangwang   translate
260
        nllb-200-distilled-600m:
93be98cb   tangwang   清理过时的文档
261
          enabled: true
432d1c88   tangwang   评估框架
262
263
264
265
266
267
          backend: local_nllb
          model_id: facebook/nllb-200-distilled-600M
          # ct2_model_dir is a subdirectory of model_dir; both paths are
          # relative (start with ./).
          model_dir: ./models/translation/facebook/nllb-200-distilled-600M
          ct2_model_dir: ./models/translation/facebook/nllb-200-distilled-600M/ctranslate2-float16
          # Compute type and conversion quantization are both float16, matching
          # the "ctranslate2-float16" directory name.
          ct2_compute_type: float16
          ct2_conversion_quantization: float16
ea293660   tangwang   CTranslate2
268
          ct2_auto_convert: true
46ce858d   tangwang   在NLLB模型的 /data/sa...
269
          ct2_inter_threads: 4
ea293660   tangwang   CTranslate2
270
          ct2_intra_threads: 0
46ce858d   tangwang   在NLLB模型的 /data/sa...
271
          ct2_max_queued_batches: 32
432d1c88   tangwang   评估框架
272
273
          ct2_batch_type: examples
          ct2_decoding_length_mode: source
46ce858d   tangwang   在NLLB模型的 /data/sa...
274
275
          ct2_decoding_length_extra: 8
          ct2_decoding_length_min: 32
432d1c88   tangwang   评估框架
276
277
          device: cuda
          torch_dtype: float16
4747e2f4   tangwang   embedding perform...
278
          batch_size: 64
0fd2f875   tangwang   translate
279
          max_input_length: 256
3eff49b7   tangwang   trans nllb-200-di...
280
          max_new_tokens: 64
0fd2f875   tangwang   translate
281
          num_beams: 1
cd4ce66d   tangwang   trans logs
282
          use_cache: true
0fd2f875   tangwang   translate
283
        opus-mt-zh-en:
f86c5fee   tangwang   reranker性能参数脚本放在:...
284
          enabled: false
432d1c88   tangwang   评估框架
285
286
287
288
289
290
          backend: local_marian
          model_id: Helsinki-NLP/opus-mt-zh-en
          model_dir: ./models/translation/Helsinki-NLP/opus-mt-zh-en
          ct2_model_dir: ./models/translation/Helsinki-NLP/opus-mt-zh-en/ctranslate2-float16
          ct2_compute_type: float16
          ct2_conversion_quantization: float16
ea293660   tangwang   CTranslate2
291
292
293
294
          ct2_auto_convert: true
          ct2_inter_threads: 1
          ct2_intra_threads: 0
          ct2_max_queued_batches: 0
432d1c88   tangwang   评估框架
295
296
297
          ct2_batch_type: examples
          device: cuda
          torch_dtype: float16
0fd2f875   tangwang   translate
298
299
300
301
          batch_size: 16
          max_input_length: 256
          max_new_tokens: 256
          num_beams: 1
cd4ce66d   tangwang   trans logs
302
          use_cache: true
0fd2f875   tangwang   translate
303
        opus-mt-en-zh:
f86c5fee   tangwang   reranker性能参数脚本放在:...
304
          enabled: false
432d1c88   tangwang   评估框架
305
306
307
308
309
310
          backend: local_marian
          model_id: Helsinki-NLP/opus-mt-en-zh
          model_dir: ./models/translation/Helsinki-NLP/opus-mt-en-zh
          ct2_model_dir: ./models/translation/Helsinki-NLP/opus-mt-en-zh/ctranslate2-float16
          ct2_compute_type: float16
          ct2_conversion_quantization: float16
ea293660   tangwang   CTranslate2
311
312
313
314
          ct2_auto_convert: true
          ct2_inter_threads: 1
          ct2_intra_threads: 0
          ct2_max_queued_batches: 0
432d1c88   tangwang   评估框架
315
316
317
          ct2_batch_type: examples
          device: cuda
          torch_dtype: float16
0fd2f875   tangwang   translate
318
319
320
321
          batch_size: 16
          max_input_length: 256
          max_new_tokens: 256
          num_beams: 1
cd4ce66d   tangwang   trans logs
322
          use_cache: true
42e3aea6   tangwang   tidy
323
    embedding:
432d1c88   tangwang   评估框架
324
      provider: http
42e3aea6   tangwang   tidy
325
326
      providers:
        http:
432d1c88   tangwang   评估框架
327
328
329
          text_base_url: http://127.0.0.1:6005
          image_base_url: http://127.0.0.1:6008
      backend: tei
07cf5a93   tangwang   START_EMBEDDING=...
330
331
      backends:
        tei:
432d1c88   tangwang   评估框架
332
          base_url: http://127.0.0.1:8080
efd435cf   tangwang   tei性能调优:
333
          timeout_sec: 20
432d1c88   tangwang   评估框架
334
          model_id: Qwen/Qwen3-Embedding-0.6B
07cf5a93   tangwang   START_EMBEDDING=...
335
        local_st:
432d1c88   tangwang   评估框架
336
337
          model_id: Qwen/Qwen3-Embedding-0.6B
          device: cuda
07cf5a93   tangwang   START_EMBEDDING=...
338
339
          batch_size: 32
          normalize_embeddings: true
432d1c88   tangwang   评估框架
340
      image_backend: clip_as_service
86d8358b   tangwang   config optimize
341
342
      image_backends:
        clip_as_service:
432d1c88   tangwang   评估框架
343
344
          server: grpc://127.0.0.1:51000
          model_name: CN-CLIP/ViT-L-14
86d8358b   tangwang   config optimize
345
346
347
          batch_size: 8
          normalize_embeddings: true
        local_cnclip:
432d1c88   tangwang   评估框架
348
          model_name: ViT-L-14
86d8358b   tangwang   config optimize
349
350
351
          device: null
          batch_size: 8
          normalize_embeddings: true
42e3aea6   tangwang   tidy
352
    rerank:
432d1c88   tangwang   评估框架
353
      provider: http
42e3aea6   tangwang   tidy
354
355
      providers:
        http:
daa2690b   tangwang   漏斗参数调优&呈现优化
356
357
          instances:
            default:
432d1c88   tangwang   评估框架
358
359
              base_url: http://127.0.0.1:6007
              service_url: http://127.0.0.1:6007/rerank
daa2690b   tangwang   漏斗参数调优&呈现优化
360
            fine:
432d1c88   tangwang   评估框架
361
362
              base_url: http://127.0.0.1:6009
              service_url: http://127.0.0.1:6009/rerank
86d8358b   tangwang   config optimize
363
364
365
      request:
        max_docs: 1000
        normalize: true
432d1c88   tangwang   评估框架
366
      default_instance: default
daa2690b   tangwang   漏斗参数调优&呈现优化
367
368
      instances:
        default:
432d1c88   tangwang   评估框架
369
          host: 0.0.0.0
daa2690b   tangwang   漏斗参数调优&呈现优化
370
          port: 6007
432d1c88   tangwang   评估框架
371
372
          backend: qwen3_vllm_score
          runtime_dir: ./.runtime/reranker/default
daa2690b   tangwang   漏斗参数调优&呈现优化
373
        fine:
432d1c88   tangwang   评估框架
374
          host: 0.0.0.0
daa2690b   tangwang   漏斗参数调优&呈现优化
375
          port: 6009
432d1c88   tangwang   评估框架
376
377
          backend: bge
          runtime_dir: ./.runtime/reranker/fine
701ae503   tangwang   docs
378
379
      backends:
        bge:
432d1c88   tangwang   评估框架
380
          model_name: BAAI/bge-reranker-v2-m3
701ae503   tangwang   docs
381
382
          device: null
          use_fp16: true
418b6a4a   tangwang   调参
383
          batch_size: 80
00c8ddb9   tangwang   suggest rank opti...
384
          max_length: 160
432d1c88   tangwang   评估框架
385
          cache_dir: ./model_cache
701ae503   tangwang   docs
386
          enable_warmup: true
971a0851   tangwang   补充reranker-jina,探...
387
        jina_reranker_v3:
432d1c88   tangwang   评估框架
388
          model_name: jinaai/jina-reranker-v3
971a0851   tangwang   补充reranker-jina,探...
389
          device: null
432d1c88   tangwang   评估框架
390
          dtype: float16
971a0851   tangwang   补充reranker-jina,探...
391
          batch_size: 64
74116f05   tangwang   jina-reranker-v3性...
392
393
394
          max_doc_length: 160
          max_query_length: 64
          sort_by_doc_length: true
432d1c88   tangwang   评估框架
395
          cache_dir: ./model_cache
971a0851   tangwang   补充reranker-jina,探...
396
          trust_remote_code: true
701ae503   tangwang   docs
397
        qwen3_vllm:
432d1c88   tangwang   评估框架
398
399
          model_name: Qwen/Qwen3-Reranker-0.6B
          engine: vllm
b0972ff9   tangwang   qwen3_vllm_score ...
400
          max_model_len: 256
701ae503   tangwang   docs
401
          tensor_parallel_size: 1
432d1c88   tangwang   评估框架
402
403
          gpu_memory_utilization: 0.2
          dtype: float16
bc089b43   tangwang   refactor(reranker...
404
405
          enable_prefix_caching: true
          enforce_eager: false
00c8ddb9   tangwang   suggest rank opti...
406
          infer_batch_size: 100
9f5994b4   tangwang   reranker
407
          sort_by_doc_length: true
432d1c88   tangwang   评估框架
408
409
          instruction_format: standard
          instruction: rank products by given query
9de5ef49   tangwang   qwen3_vllm_score ...
410
        qwen3_vllm_score:
432d1c88   tangwang   评估框架
411
          model_name: Qwen/Qwen3-Reranker-0.6B
9de5ef49   tangwang   qwen3_vllm_score ...
412
          use_original_qwen3_hf_overrides: true
432d1c88   tangwang   评估框架
413
          engine: vllm
f86c5fee   tangwang   reranker性能参数脚本放在:...
414
          max_model_len: 172
9de5ef49   tangwang   qwen3_vllm_score ...
415
          tensor_parallel_size: 1
c3425429   tangwang   在以下文件中完成精排/融合清理工作...
416
          gpu_memory_utilization: 0.15
432d1c88   tangwang   评估框架
417
          dtype: float16
9de5ef49   tangwang   qwen3_vllm_score ...
418
419
          enable_prefix_caching: true
          enforce_eager: false
3b35f139   tangwang   search evalution
420
          infer_batch_size: 80
9de5ef49   tangwang   qwen3_vllm_score ...
421
          sort_by_doc_length: true
432d1c88   tangwang   评估框架
422
423
          instruction_format: standard
          instruction: Rank products by query with category & style match prioritized
d31c7f65   tangwang   补充云服务reranker
424
        qwen3_transformers:
432d1c88   tangwang   评估框架
425
426
          model_name: Qwen/Qwen3-Reranker-0.6B
          instruction: rank products by given query
d31c7f65   tangwang   补充云服务reranker
427
428
429
          max_length: 8192
          batch_size: 64
          use_fp16: true
432d1c88   tangwang   评估框架
430
          attn_implementation: sdpa
4823f463   tangwang   qwen3_vllm_score ...
431
        qwen3_transformers_packed:
432d1c88   tangwang   评估框架
432
433
          model_name: Qwen/Qwen3-Reranker-0.6B
          instruction: Rank products by query with category & style match prioritized
b0972ff9   tangwang   qwen3_vllm_score ...
434
          max_model_len: 256
4823f463   tangwang   qwen3_vllm_score ...
435
436
437
438
          max_doc_len: 160
          max_docs_per_pack: 0
          use_fp16: true
          sort_by_doc_length: true
432d1c88   tangwang   评估框架
439
          attn_implementation: eager
3d508beb   tangwang   reranker-4b-gguf
440
        qwen3_gguf:
432d1c88   tangwang   评估框架
441
442
443
444
445
          repo_id: DevQuasar/Qwen.Qwen3-Reranker-4B-GGUF
          filename: '*Q8_0.gguf'
          cache_dir: ./model_cache
          local_dir: ./models/reranker/qwen3-reranker-4b-gguf
          instruction: Rank products by query with category & style match prioritized
5c21a485   tangwang   qwen3-reranker-0....
446
447
448
449
          n_ctx: 512
          n_batch: 512
          n_ubatch: 512
          n_gpu_layers: 999
3d508beb   tangwang   reranker-4b-gguf
450
451
452
453
454
455
456
457
458
          main_gpu: 0
          n_threads: 2
          n_threads_batch: 4
          flash_attn: true
          offload_kqv: true
          use_mmap: true
          use_mlock: false
          infer_batch_size: 8
          sort_by_doc_length: true
432d1c88   tangwang   评估框架
459
          length_sort_mode: char
3d508beb   tangwang   reranker-4b-gguf
460
461
          enable_warmup: true
          verbose: false
5c21a485   tangwang   qwen3-reranker-0....
462
        qwen3_gguf_06b:
432d1c88   tangwang   评估框架
463
464
465
466
467
          repo_id: ggml-org/Qwen3-Reranker-0.6B-Q8_0-GGUF
          filename: qwen3-reranker-0.6b-q8_0.gguf
          cache_dir: ./model_cache
          local_dir: ./models/reranker/qwen3-reranker-0.6b-q8_0-gguf
          instruction: Rank products by query with category & style match prioritized
5c21a485   tangwang   qwen3-reranker-0....
468
469
470
471
472
473
474
475
476
477
478
479
480
          # n_ctx, n_batch and n_ubatch are all 256 here; the sibling
          # qwen3_gguf backend sets the same three keys to 512.
          n_ctx: 256
          n_batch: 256
          n_ubatch: 256
          # NOTE(review): 999 presumably means "offload every layer" — confirm
          # against the GGUF runtime's handling of n_gpu_layers.
          n_gpu_layers: 999
          main_gpu: 0
          n_threads: 2
          n_threads_batch: 4
          flash_attn: true
          offload_kqv: true
          use_mmap: true
          use_mlock: false
          infer_batch_size: 32
          sort_by_doc_length: true
432d1c88   tangwang   评估框架
481
          length_sort_mode: char
5c21a485   tangwang   qwen3-reranker-0....
482
483
484
          reuse_query_state: false
          enable_warmup: true
          verbose: false
d31c7f65   tangwang   补充云服务reranker
485
        dashscope_rerank:
432d1c88   tangwang   评估框架
486
487
488
489
490
491
492
          model_name: qwen3-rerank
          endpoint: https://dashscope.aliyuncs.com/compatible-api/v1/reranks
          # Names an environment variable; the key itself is not stored here.
          api_key_env: RERANK_DASHSCOPE_API_KEY_CN
          timeout_sec: 10.0
          top_n_cap: 0
          # NOTE(review): this backend spells the keys "batchsize" and
          # "instruct", while sibling backends in this file use "batch_size"
          # and "instruction" — confirm the consumer expects these exact names.
          batchsize: 64
          instruct: Given a shopping query, rank product titles by relevance
d31c7f65   tangwang   补充云服务reranker
493
494
          max_retries: 2
          retry_backoff_sec: 0.2
4d824a77   tangwang   所有租户共用一套统一配置.tena...
495
496
  spu_config:
    enabled: true
432d1c88   tangwang   评估框架
497
    spu_field: spu_id
4d824a77   tangwang   所有租户共用一套统一配置.tena...
498
    inner_hits_size: 10
432d1c88   tangwang   评估框架
499
500
501
502
    searchable_option_dimensions:
    - option1
    - option2
    - option3
0064e946   tangwang   feat: 增量索引服务、租户配置...
503
  tenant_config:
0064e946   tangwang   feat: 增量索引服务、租户配置...
504
    default:
432d1c88   tangwang   评估框架
505
506
507
508
      primary_language: en
      index_languages:
      - en
      - zh
0064e946   tangwang   feat: 增量索引服务、租户配置...
509
    tenants:
432d1c88   tangwang   评估框架
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
      # Per-tenant overrides. Tenant IDs are quoted so they stay string keys.
      # In every entry the primary language is also the first item of
      # index_languages.
      '1':
        primary_language: zh
        index_languages:
        - zh
        - en
      # Same values as tenant_config.default (en primary; en, zh indexed).
      '2':
        primary_language: en
        index_languages:
        - en
        - zh
      '3':
        primary_language: zh
        index_languages:
        - zh
        - en
      '162':
        primary_language: zh
        index_languages:
        - zh
        - en
      # Same values as tenant_config.default (en primary; en, zh indexed).
      '170':
        primary_language: en
        index_languages:
        - en
        - zh