Blame view

config/config_loader.py 16.9 KB
be52af70   tangwang   first commit
1
  """
9cb7528e   tangwang   店匠体系数据的搜索:mock da...
2
  Configuration loader and validator for search engine configurations.
be52af70   tangwang   first commit
3
4
  
  This module handles loading, parsing, and validating YAML configuration files
33839b37   tangwang   属性值参与搜索:
5
6
7
8
  that define how search should be executed (NOT how data should be indexed).
  
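  The index structure is defined by mappings/search_products.json.
  This configuration only defines search behavior: field boosts, search domains, query strategies, etc.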
be52af70   tangwang   first commit
9
10
11
12
13
14
15
16
  """
  
  import yaml
  import os
  from typing import Dict, Any, List, Optional
  from dataclasses import dataclass, field
  from pathlib import Path
  
be52af70   tangwang   first commit
17
18
19
20
21
22
  
  @dataclass
  class IndexConfig:
      """One index (search) domain, e.g. default, title or brand.

      Attributes:
          name: Name of the domain.
          label: Label of the domain.
          fields: Names of the fields included in this search domain.
          boost: Boost for the domain; 1.0 unless overridden.
          example: Optional example for the domain; None when not given.
      """

      name: str
      label: str
      fields: List[str]
      boost: float = 1.0
      example: Optional[str] = None
  
be52af70   tangwang   first commit
27
28
29
30
31
  
  @dataclass
  class QueryConfig:
      """Settings that govern query processing."""

      # --- Languages ---
      supported_languages: List[str] = field(default_factory=lambda: ["zh", "en"])
      default_language: str = "en"

      # --- Feature flags ---
      enable_text_embedding: bool = True
      enable_query_rewrite: bool = True
      # Multi-language search using translations.
      enable_multilang_search: bool = True

      # --- Query rewrite dictionary (filled from an external file) ---
      rewrite_dictionary: Dict[str, str] = field(default_factory=dict)

      # --- Translation settings ---
      translation_service: str = "deepl"
      translation_api_key: Optional[str] = None
      translation_glossary_id: Optional[str] = None
      translation_context: str = "e-commerce product search"
      # Translation prompts for different use cases.
      translation_prompts: Dict[str, str] = field(default_factory=dict)

      # --- Embedding field names ---
      text_embedding_field: Optional[str] = "title_embedding"
      image_embedding_field: Optional[str] = None

      # --- Thresholds below which vector search is disabled (short queries) ---
      embedding_disable_chinese_char_limit: int = 4
      embedding_disable_english_word_limit: int = 3

      # --- Source fields configuration ---
      source_fields: Optional[List[str]] = None

      # --- Boost value for KNN (embedding recall) ---
      knn_boost: float = 0.25
13377199   tangwang   接口优化
62
  
be52af70   tangwang   first commit
63
64
65
66
67
  
  @dataclass
  class SPUConfig:
      """Settings for SPU aggregation."""

      enabled: bool = False
      spu_field: Optional[str] = None
      inner_hits_size: int = 3
      # Which option dimensions take part in retrieval (both indexing and online search).
      searchable_option_dimensions: List[str] = field(
          default_factory=lambda: ["option1", "option2", "option3"]
      )
be52af70   tangwang   first commit
72
73
74
  
  
  @dataclass
  class FunctionScoreConfig:
      """Function score configuration (ES-level scoring rules)."""

      score_mode: str = "sum"
      boost_mode: str = "multiply"
      # Each instance gets its own, initially empty, list of function definitions.
      functions: List[Dict[str, Any]] = field(default_factory=list)
  
  
  @dataclass
  class RankingConfig:
      """Ranking expression settings.

      Attributes:
          expression: Ranking expression; "bm25()" unless overridden.
          description: Description of the ranking expression.
      """

      expression: str = "bm25()"
      description: str = "Default BM25 ranking"
  
  
  @dataclass
  class RerankConfig:
      """Rerank configuration.

      Sole implementation: an external BGE rerank service is called; the request
      parameter ai_search controls whether reranking runs.
      """

      # Rerank window: when ai_search is set and from+size <= rerank_window, the
      # top rerank_window hits are fetched from ES, reranked, and then paginated.
      rerank_window: int = 1000
      # Optional rerank service URL; when empty, the reranker module's default
      # port 6007 is used.
      service_url: Optional[str] = None
      timeout_sec: float = 15.0
      weight_es: float = 0.4
      weight_ai: float = 0.6
a00c3672   tangwang   feat: Function Sc...
99
100
101
  
  
  @dataclass
  class SearchConfig:
      """Complete configuration for search engine (multi-tenant)."""

      # Field boosts used at search time.
      field_boosts: Dict[str, float]

      # Query domains (index structure).
      indexes: List[IndexConfig]

      # Query processing settings.
      query_config: QueryConfig

      # Ranking settings.
      ranking: RankingConfig

      # Function score settings (ES-level scoring).
      function_score: FunctionScoreConfig

      # Rerank settings.
      rerank: RerankConfig

      # SPU settings.
      spu_config: SPUConfig

      # Name of the ES index.
      es_index_name: str

      # Tenant configuration; empty dict per instance unless provided.
      tenant_config: Dict[str, Any] = field(default_factory=dict)

      # ES settings; empty dict per instance unless provided.
      es_settings: Dict[str, Any] = field(default_factory=dict)
  
  
  class ConfigurationError(Exception):
      """Error raised when the configuration fails validation."""
  
  
  class ConfigLoader:
4d824a77   tangwang   所有租户共用一套统一配置.tena...
142
      """Loads and validates unified search engine configuration from YAML file."""
a77693fe   tangwang   调整配置目录结构
143
      
33839b37   tangwang   属性值参与搜索:
144
      def __init__(self, config_file: Optional[Path] = None):
a77693fe   tangwang   调整配置目录结构
145
          """
33839b37   tangwang   属性值参与搜索:
146
          Initialize config loader.
a77693fe   tangwang   调整配置目录结构
147
          
33839b37   tangwang   属性值参与搜索:
148
149
          Args:
              config_file: Path to config YAML file (defaults to config/config.yaml)
a77693fe   tangwang   调整配置目录结构
150
          """
33839b37   tangwang   属性值参与搜索:
151
152
153
154
155
156
157
158
          if config_file is None:
              config_file = Path(__file__).parent / "config.yaml"
          self.config_file = Path(config_file)
      
      def _load_rewrite_dictionary(self) -> Dict[str, str]:
          """Load query rewrite dictionary from external file."""
          rewrite_file = Path(__file__).parent / "rewrite_dictionary.txt"
          rewrite_dict = {}
a77693fe   tangwang   调整配置目录结构
159
          
33839b37   tangwang   属性值参与搜索:
160
161
          if not rewrite_file.exists():
              return rewrite_dict
a77693fe   tangwang   调整配置目录结构
162
          
a77693fe   tangwang   调整配置目录结构
163
          try:
33839b37   tangwang   属性值参与搜索:
164
165
              with open(rewrite_file, 'r', encoding='utf-8') as f:
                  for line in f:
a77693fe   tangwang   调整配置目录结构
166
                      line = line.strip()
a77693fe   tangwang   调整配置目录结构
167
168
169
                      if not line or line.startswith('#'):
                          continue
                      
a77693fe   tangwang   调整配置目录结构
170
                      parts = line.split('\t')
33839b37   tangwang   属性值参与搜索:
171
172
173
174
175
                      if len(parts) >= 2:
                          original = parts[0].strip()
                          replacement = parts[1].strip()
                          if original and replacement:
                              rewrite_dict[original] = replacement
a77693fe   tangwang   调整配置目录结构
176
          except Exception as e:
33839b37   tangwang   属性值参与搜索:
177
              print(f"Warning: Failed to load rewrite dictionary: {e}")
a77693fe   tangwang   调整配置目录结构
178
179
          
          return rewrite_dict
33839b37   tangwang   属性值参与搜索:
180
      
9f96d6f3   tangwang   短query不用语义搜索
181
      def load_config(self, validate: bool = True) -> SearchConfig:
          """
          Load unified configuration from YAML file.

          Args:
              validate: Whether to validate configuration after loading

          Returns:
              SearchConfig object

          Raises:
              ConfigurationError: If the config file is not found, cannot be read,
                  is not valid YAML, does not contain a mapping at the top level,
                  or validation fails
          """
          if not self.config_file.exists():
              raise ConfigurationError(f"Configuration file not found: {self.config_file}")

          try:
              with open(self.config_file, 'r', encoding='utf-8') as f:
                  config_data = yaml.safe_load(f)
          except yaml.YAMLError as e:
              raise ConfigurationError(f"Invalid YAML in {self.config_file}: {e}") from e
          except (OSError, UnicodeDecodeError) as e:
              # E.g. the path is a directory, is unreadable, or is not UTF-8 text.
              raise ConfigurationError(
                  f"Cannot read configuration file {self.config_file}: {e}"
              ) from e

          # An empty file loads as None and a scalar/list document is not a mapping;
          # either would otherwise crash the parser with an AttributeError.
          if not isinstance(config_data, dict):
              raise ConfigurationError(
                  f"Configuration file {self.config_file} must contain a YAML mapping "
                  f"at the top level, got {type(config_data).__name__}"
              )

          config = self._parse_config(config_data)

          # Auto-validate configuration
          if validate:
              errors = self.validate_config(config)
              if errors:
                  error_msg = "Configuration validation failed:\n" + "\n".join(f"  - {err}" for err in errors)
                  raise ConfigurationError(error_msg)

          return config
33839b37   tangwang   属性值参与搜索:
213
      
9cb7528e   tangwang   店匠体系数据的搜索:mock da...
214
215
      def _parse_config(self, config_data: Dict[str, Any]) -> SearchConfig:
          """
          Parse configuration dictionary into SearchConfig object.

          Optional sections that are missing or explicitly null are treated as
          empty, so the defaults below apply instead of the parser crashing.

          Args:
              config_data: Top-level mapping loaded from the YAML file

          Returns:
              SearchConfig built from the mapping (validation is a separate step)

          Raises:
              ConfigurationError: If a section has the wrong type, or a rerank
                  value cannot be converted to a number
          """

          def section(parent: Dict[str, Any], key: str) -> Dict[str, Any]:
              # A key present with no value loads as None; treat it like a missing key.
              value = parent.get(key)
              if value is None:
                  return {}
              if not isinstance(value, dict):
                  raise ConfigurationError(f"{key} must be a dictionary")
              return value

          # Parse field_boosts
          field_boosts = config_data.get("field_boosts", {})
          if not isinstance(field_boosts, dict):
              raise ConfigurationError("field_boosts must be a dictionary")

          # Parse indexes
          indexes_data = config_data.get("indexes") or []
          if not isinstance(indexes_data, list):
              raise ConfigurationError("indexes must be a list")
          indexes = [self._parse_index_config(index_data) for index_data in indexes_data]

          # Parse query config
          query_config_data = section(config_data, "query_config")

          # Load rewrite dictionary from external file
          rewrite_dictionary = self._load_rewrite_dictionary()

          # Parse embedding disable thresholds
          embedding_thresholds = section(query_config_data, "embedding_disable_thresholds")

          query_config = QueryConfig(
              supported_languages=query_config_data.get("supported_languages") or ["zh", "en"],
              default_language=query_config_data.get("default_language") or "en",
              enable_text_embedding=query_config_data.get("enable_text_embedding", True),
              enable_query_rewrite=query_config_data.get("enable_query_rewrite", True),
              # Previously never read, so the flag could not be turned off from config.
              enable_multilang_search=query_config_data.get("enable_multilang_search", True),
              rewrite_dictionary=rewrite_dictionary,
              translation_api_key=query_config_data.get("translation_api_key"),
              translation_service=query_config_data.get("translation_service") or "deepl",
              translation_glossary_id=query_config_data.get("translation_glossary_id"),
              translation_context=query_config_data.get("translation_context") or "e-commerce product search",
              translation_prompts=query_config_data.get("translation_prompts") or {},
              # NOTE(review): an omitted key yields None here, while the QueryConfig
              # dataclass default is "title_embedding" - confirm which is intended.
              text_embedding_field=query_config_data.get("text_embedding_field"),
              image_embedding_field=query_config_data.get("image_embedding_field"),
              embedding_disable_chinese_char_limit=embedding_thresholds.get("chinese_char_limit", 4),
              embedding_disable_english_word_limit=embedding_thresholds.get("english_word_limit", 3),
              source_fields=query_config_data.get("source_fields"),
              knn_boost=query_config_data.get("knn_boost", 0.25)
          )

          # Parse ranking config
          ranking_data = section(config_data, "ranking")
          ranking = RankingConfig(
              expression=ranking_data.get("expression") or "bm25() + 0.2*text_embedding_relevance()",
              description=ranking_data.get("description") or "Default BM25 + text embedding ranking"
          )

          # Parse Function Score configuration
          fs_data = section(config_data, "function_score")
          function_score = FunctionScoreConfig(
              score_mode=fs_data.get("score_mode") or "sum",
              boost_mode=fs_data.get("boost_mode") or "multiply",
              functions=fs_data.get("functions") or []
          )

          # Parse Rerank configuration (sole implementation: external rerank
          # service, controlled by ai_search)
          rerank_data = section(config_data, "rerank")
          try:
              rerank = RerankConfig(
                  rerank_window=int(rerank_data.get("rerank_window", 1000)),
                  service_url=rerank_data.get("service_url") or None,
                  timeout_sec=float(rerank_data.get("timeout_sec", 15.0)),
                  weight_es=float(rerank_data.get("weight_es", 0.4)),
                  weight_ai=float(rerank_data.get("weight_ai", 0.6)),
              )
          except (TypeError, ValueError) as e:
              # Non-numeric or null values would otherwise surface as a raw conversion error.
              raise ConfigurationError(f"Invalid rerank configuration: {e}") from e

          # Parse SPU config
          spu_data = section(config_data, "spu_config")
          spu_config = SPUConfig(
              enabled=spu_data.get("enabled", False),
              spu_field=spu_data.get("spu_field"),
              inner_hits_size=spu_data.get("inner_hits_size", 3),
              searchable_option_dimensions=spu_data.get("searchable_option_dimensions", ['option1', 'option2', 'option3'])
          )

          # Parse tenant config
          tenant_config_data = section(config_data, "tenant_config")

          return SearchConfig(
              field_boosts=field_boosts,
              indexes=indexes,
              query_config=query_config,
              ranking=ranking,
              function_score=function_score,
              rerank=rerank,
              spu_config=spu_config,
              tenant_config=tenant_config_data,
              es_index_name=config_data.get("es_index_name", "search_products"),
              es_settings=section(config_data, "es_settings")
          )
33839b37   tangwang   属性值参与搜索:
304
      
be52af70   tangwang   first commit
305
306
      def _parse_index_config(self, index_data: Dict[str, Any]) -> IndexConfig:
          """
          Parse index configuration from dictionary.

          Args:
              index_data: One entry of the "indexes" list

          Returns:
              IndexConfig for the entry; label falls back to the name, fields to
              an empty list and boost to 1.0 when not given

          Raises:
              ConfigurationError: If the entry is not a dictionary or has no name
          """
          if not isinstance(index_data, dict):
              raise ConfigurationError(
                  f"Index definition must be a dictionary, got {type(index_data).__name__}"
              )

          # Report a missing name as a configuration problem rather than a bare KeyError.
          name = index_data.get("name")
          if name is None:
              raise ConfigurationError("Index definition is missing required 'name'")

          return IndexConfig(
              name=name,
              label=index_data.get("label", name),
              # A null "fields" entry becomes an empty list, which validation then flags.
              fields=index_data.get("fields") or [],
              boost=index_data.get("boost", 1.0),
              example=index_data.get("example")
          )
33839b37   tangwang   属性值参与搜索:
314
      
9cb7528e   tangwang   店匠体系数据的搜索:mock da...
315
      def validate_config(self, config: SearchConfig) -> List[str]:
be52af70   tangwang   first commit
316
          """
33839b37   tangwang   属性值参与搜索:
317
318
          Validate configuration for common errors.
          
be52af70   tangwang   first commit
319
          Args:
33839b37   tangwang   属性值参与搜索:
320
321
              config: SearchConfig to validate
          
be52af70   tangwang   first commit
322
          Returns:
33839b37   tangwang   属性值参与搜索:
323
              List of error messages (empty if valid)
be52af70   tangwang   first commit
324
325
          """
          errors = []
b926f678   tangwang   多语言查询
326
          
33839b37   tangwang   属性值参与搜索:
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
          # Validate es_index_name
          if not config.es_index_name:
              errors.append("es_index_name is required")
          
          # Validate field_boosts
          if not config.field_boosts:
              errors.append("field_boosts is empty")
          
          for field_name, boost in config.field_boosts.items():
              if not isinstance(boost, (int, float)):
                  errors.append(f"field_boosts['{field_name}']: boost must be a number, got {type(boost).__name__}")
              elif boost < 0:
                  errors.append(f"field_boosts['{field_name}']: boost must be non-negative")
          
          # Validate indexes
          if not config.indexes:
              errors.append("At least one index domain must be defined")
          
          index_names = set()
be52af70   tangwang   first commit
346
          for index in config.indexes:
33839b37   tangwang   属性值参与搜索:
347
348
349
350
              # Check for duplicate index names
              if index.name in index_names:
                  errors.append(f"Duplicate index name: {index.name}")
              index_names.add(index.name)
b926f678   tangwang   多语言查询
351
              
33839b37   tangwang   属性值参与搜索:
352
353
354
355
              # Validate fields in index
              if not index.fields:
                  errors.append(f"Index '{index.name}': fields list is empty")
          
be52af70   tangwang   first commit
356
357
358
359
          # Validate SPU config
          if config.spu_config.enabled:
              if not config.spu_config.spu_field:
                  errors.append("SPU aggregation enabled but no spu_field specified")
33839b37   tangwang   属性值参与搜索:
360
361
362
363
364
365
366
367
368
369
370
          
          # Validate query config
          if not config.query_config.supported_languages:
              errors.append("At least one supported language must be specified")
          
          if config.query_config.default_language not in config.query_config.supported_languages:
              errors.append(
                  f"Default language '{config.query_config.default_language}' "
                  f"not in supported languages: {config.query_config.supported_languages}"
              )
          
be52af70   tangwang   first commit
371
          return errors
33839b37   tangwang   属性值参与搜索:
372
373
374
      
      def to_dict(self, config: SearchConfig) -> Dict[str, Any]:
          """Convert SearchConfig to dictionary representation."""
a77693fe   tangwang   调整配置目录结构
375
          
33839b37   tangwang   属性值参与搜索:
376
          # Build query_config dict
9f96d6f3   tangwang   短query不用语义搜索
377
378
379
          query_config_dict = {
              "supported_languages": config.query_config.supported_languages,
              "default_language": config.query_config.default_language,
9f96d6f3   tangwang   短query不用语义搜索
380
381
382
              "enable_text_embedding": config.query_config.enable_text_embedding,
              "enable_query_rewrite": config.query_config.enable_query_rewrite,
              "translation_service": config.query_config.translation_service,
33839b37   tangwang   属性值参与搜索:
383
384
385
              "text_embedding_field": config.query_config.text_embedding_field,
              "image_embedding_field": config.query_config.image_embedding_field,
              "embedding_disable_thresholds": {
9f96d6f3   tangwang   短query不用语义搜索
386
387
                  "chinese_char_limit": config.query_config.embedding_disable_chinese_char_limit,
                  "english_word_limit": config.query_config.embedding_disable_english_word_limit
33839b37   tangwang   属性值参与搜索:
388
389
390
              },
              "source_fields": config.query_config.source_fields
          }
9f96d6f3   tangwang   短query不用语义搜索
391
          
33839b37   tangwang   属性值参与搜索:
392
          return {
be52af70   tangwang   first commit
393
394
              "es_index_name": config.es_index_name,
              "es_settings": config.es_settings,
33839b37   tangwang   属性值参与搜索:
395
              "field_boosts": config.field_boosts,
be52af70   tangwang   first commit
396
              "indexes": [self._index_to_dict(index) for index in config.indexes],
9f96d6f3   tangwang   短query不用语义搜索
397
              "query_config": query_config_dict,
be52af70   tangwang   first commit
398
399
400
401
              "ranking": {
                  "expression": config.ranking.expression,
                  "description": config.ranking.description
              },
1f6d15fa   tangwang   重构:SPU级别索引、统一索引架构...
402
403
404
405
406
407
              "function_score": {
                  "score_mode": config.function_score.score_mode,
                  "boost_mode": config.function_score.boost_mode,
                  "functions": config.function_score.functions
              },
              "rerank": {
506c39b7   tangwang   feat(search): 统一重...
408
409
410
411
412
                  "rerank_window": config.rerank.rerank_window,
                  "service_url": config.rerank.service_url,
                  "timeout_sec": config.rerank.timeout_sec,
                  "weight_es": config.rerank.weight_es,
                  "weight_ai": config.rerank.weight_ai,
1f6d15fa   tangwang   重构:SPU级别索引、统一索引架构...
413
              },
be52af70   tangwang   first commit
414
415
416
              "spu_config": {
                  "enabled": config.spu_config.enabled,
                  "spu_field": config.spu_config.spu_field,
33839b37   tangwang   属性值参与搜索:
417
418
                  "inner_hits_size": config.spu_config.inner_hits_size,
                  "searchable_option_dimensions": config.spu_config.searchable_option_dimensions
be52af70   tangwang   first commit
419
420
              }
          }
a77693fe   tangwang   调整配置目录结构
421
      
be52af70   tangwang   first commit
422
      def _index_to_dict(self, index: IndexConfig) -> Dict[str, Any]:
33839b37   tangwang   属性值参与搜索:
423
          """Convert IndexConfig to dictionary."""
b926f678   tangwang   多语言查询
424
          result = {
be52af70   tangwang   first commit
425
426
427
              "name": index.name,
              "label": index.label,
              "fields": index.fields,
33839b37   tangwang   属性值参与搜索:
428
              "boost": index.boost
b926f678   tangwang   多语言查询
429
          }
9f96d6f3   tangwang   短query不用语义搜索
430
          
9f96d6f3   tangwang   短query不用语义搜索
431
432
          if index.example:
              result["example"] = index.example
33839b37   tangwang   属性值参与搜索:
433
434
435
          
          return result
  
b926f678   tangwang   多语言查询
436
  
33839b37   tangwang   属性值参与搜索:
437
438
439
440
441
442
443
444
445
446
447
448
  def load_tenant_config(tenant_id: Optional[str] = None) -> SearchConfig:
      """
      Backward-compatibility wrapper that loads the unified configuration.

      Args:
          tenant_id: Not used; accepted only so existing callers keep working

      Returns:
          SearchConfig produced by a ConfigLoader created with its default
          config file, with validation enabled
      """
      return ConfigLoader().load_config()