Blame view

scripts/test_base.py 7.06 KB
1f6d15fa   tangwang   重构:SPU级别索引、统一索引架构...
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
  #!/usr/bin/env python3
  """
  Test script for base configuration.
  
  Tests data ingestion, search API, response format, and tenant isolation.
  """
  
  import sys
  import os
  import argparse
  import requests
  import json
  from pathlib import Path
  
  # Add parent directory to path
  sys.path.insert(0, str(Path(__file__).parent.parent))
  
  
  def test_search_api(base_url: str, tenant_id: str, query: str = "耳机"):
      """
      Send one search request and print a short summary of the reply.

      Args:
          base_url: API base URL; "/search/" is appended to it
          tenant_id: Tenant ID, sent in the X-Tenant-ID header
          query: Search query

      Returns:
          Parsed response JSON, or None if the request or decoding failed
      """
      endpoint = f"{base_url}/search/"
      request_headers = {"X-Tenant-ID": tenant_id, "Content-Type": "application/json"}
      request_body = {"query": query, "size": 10, "from": 0}

      for line in (
          "\nTesting search API:",
          f"  URL: {endpoint}",
          f"  Query: {query}",
          f"  Tenant ID: {tenant_id}",
      ):
          print(line)

      try:
          resp = requests.post(
              endpoint,
              json=request_body,
              headers=request_headers,
              timeout=30,
          )
          # Non-2xx statuses are turned into exceptions and reported below.
          resp.raise_for_status()
          body = resp.json()

          print(f"  Status: {resp.status_code}")
          print(f"  Total: {body.get('total', 0)}")
          print(f"  Results: {len(body.get('results', []))}")
      except Exception as exc:
          # Best-effort script: report any failure and signal it with None.
          print(f"  ERROR: {exc}")
          return None

      return body
  
  
  def validate_response_format(data: dict):
      """
      Validate the format of a search API response.

      Only the first entry of 'results', and the first entry of that
      result's 'skus', are inspected.

      Args:
          data: Response data

      Returns:
          List of validation errors (empty if valid)
      """
      # Guard against a non-object payload so the membership checks below
      # cannot raise.
      if not isinstance(data, dict):
          return ["Response should be a JSON object"]

      errors = []

      # Check for results field (not hits)
      if 'hits' in data:
          errors.append("Response contains 'hits' field (should be 'results')")

      if 'results' not in data:
          errors.append("Response missing 'results' field")
      else:
          results = data['results']
          if not isinstance(results, list):
              errors.append("'results' should be a list")
          elif results:
              # Validate first result structure
              errors.extend(_validate_result(results[0]))

      # Check for suggestions and related_searches
      if 'suggestions' not in data:
          errors.append("Response missing 'suggestions' field")
      if 'related_searches' not in data:
          errors.append("Response missing 'related_searches' field")

      return errors


  def _validate_result(result):
      """Return the validation errors for a single search result entry."""
      if not isinstance(result, dict):
          return ["Result should be an object"]

      errors = []

      for field in ('spu_id', 'title', 'skus', 'relevance_score'):
          if field not in result:
              errors.append(f"Result missing required field: {field}")

      # Check for ES internal fields
      for field in ('_id', '_score', '_source'):
          if field in result:
              errors.append(f"Result contains ES internal field: {field}")

      # Validate skus
      if 'skus' in result:
          skus = result['skus']
          if not isinstance(skus, list):
              errors.append("'skus' should be a list")
          elif skus:
              errors.extend(_validate_sku(skus[0]))

      return errors


  def _validate_sku(sku):
      """Return the validation errors for a single SKU entry."""
      if not isinstance(sku, dict):
          return ["SKU should be an object"]

      return [
          f"SKU missing required field: {field}"
          for field in ('sku_id', 'price', 'sku', 'stock')
          if field not in sku
      ]
  
  
  def test_facets(base_url: str, tenant_id: str):
      """
      Test facets aggregation.

      Posts a search for "商品" requesting the category and vendor facets,
      then prints how many values came back for each returned facet.

      Args:
          base_url: API base URL
          tenant_id: Tenant ID

      Returns:
          Response JSON or None if failed
      """
      url = f"{base_url}/search/"
      headers = {
          "X-Tenant-ID": tenant_id,
          "Content-Type": "application/json"
      }
      payload = {
          "query": "商品",
          "size": 10,
          "facets": ["category.keyword", "vendor.keyword"]
      }

      print(f"\nTesting facets:")
      print(f"  Facets: {payload['facets']}")

      try:
          response = requests.post(url, json=payload, headers=headers, timeout=30)
          response.raise_for_status()
          data = response.json()

          if 'facets' in data and data['facets']:
              print(f"  Facets returned: {len(data['facets'])}")
              for facet in data['facets']:
                  print(f"    - {facet.get('field')}: {len(facet.get('values', []))} values")
          else:
              # An absent or empty 'facets' is reported but is not a failure.
              print("  WARNING: No facets returned")

          return data
      except Exception as e:
          # Best-effort script: report any failure and signal it with None.
          print(f"  ERROR: {e}")
          return None
  
  
  def test_tenant_isolation(base_url: str, tenant_id_1: str, tenant_id_2: str):
      """
      Test tenant isolation.

      Runs the same "商品" search for both tenants and reports whether any
      spu_id appears in both result sets.

      Args:
          base_url: API base URL
          tenant_id_1: First tenant ID
          tenant_id_2: Second tenant ID
      """
      print(f"\nTesting tenant isolation:")
      print(f"  Tenant 1: {tenant_id_1}")
      print(f"  Tenant 2: {tenant_id_2}")

      # Search for tenant 1
      data1 = test_search_api(base_url, tenant_id_1, "商品")
      # Search for tenant 2
      data2 = test_search_api(base_url, tenant_id_2, "商品")

      if not (data1 and data2):
          # Say so explicitly instead of silently skipping the comparison.
          print("  WARNING: Isolation check skipped (search failed for at least one tenant)")
          return

      overlap = _collect_spu_ids(data1) & _collect_spu_ids(data2)
      if overlap:
          print(f"  WARNING: Found {len(overlap)} overlapping results between tenants")
      else:
          print(f"  OK: No overlapping results (tenant isolation working)")


  def _collect_spu_ids(data):
      """Return the set of spu_id values present in a search response."""
      spu_ids = {result.get('spu_id') for result in data.get('results', [])}
      # Results lacking an spu_id all map to None; dropping it avoids
      # reporting a spurious overlap between tenants.
      spu_ids.discard(None)
      return spu_ids
  
  
  def main():
      """
      Parse command-line options and run the test suite in order.

      Returns:
          1 if the basic search or the response format validation fails,
          otherwise 0
      """
      cli = argparse.ArgumentParser(description='Test base configuration')
      option_specs = (
          ('--api-url', {'default': 'http://localhost:8000', 'help': 'API base URL'}),
          ('--tenant-id', {'default': '1', 'help': 'Tenant ID for testing'}),
          ('--test-tenant-2', {'help': 'Second tenant ID for isolation test'}),
      )
      for flag, settings in option_specs:
          cli.add_argument(flag, **settings)
      opts = cli.parse_args()

      banner = "=" * 60
      print(banner)
      print("Base Configuration Test Suite")
      print(banner)

      # Test 1: Basic search -- nothing else can run without a response.
      print("\n[Test 1] Basic Search")
      search_data = test_search_api(opts.api_url, opts.tenant_id)
      if not search_data:
          print("FAILED: Basic search test")
          return 1

      # Test 2: Response format validation
      print("\n[Test 2] Response Format Validation")
      format_errors = validate_response_format(search_data)
      if format_errors:
          print("FAILED: Response format validation")
          for message in format_errors:
              print(f"  - {message}")
          return 1
      print("PASSED: Response format is correct")

      # Test 3: Facets -- a failure here only warns, it does not abort.
      print("\n[Test 3] Facets Aggregation")
      if not test_facets(opts.api_url, opts.tenant_id):
          print("WARNING: Facets test failed (may be expected if no data)")

      # Test 4: Tenant isolation (if second tenant provided)
      second_tenant = opts.test_tenant_2
      if second_tenant:
          print("\n[Test 4] Tenant Isolation")
          test_tenant_isolation(opts.api_url, opts.tenant_id, second_tenant)

      print("\n" + banner)
      print("All tests completed")
      print(banner)

      return 0
  
  
  # Script entry point: use main()'s return value as the process exit status.
  if __name__ == "__main__":
      raise SystemExit(main())