Blame view

api/translator_app.py 9.75 KB
0fd2f875   tangwang   translate
1
  """Translator service HTTP app."""
768ad710   tangwang   MySQL到ES字段映射说明-业务...
2
  
768ad710   tangwang   MySQL到ES字段映射说明-业务...
3
  import argparse
0fd2f875   tangwang   translate
4
5
6
7
8
  import logging
  from contextlib import asynccontextmanager
  from functools import lru_cache
  from typing import List, Optional, Union
  
768ad710   tangwang   MySQL到ES字段映射说明-业务...
9
  import uvicorn
768ad710   tangwang   MySQL到ES字段映射说明-业务...
10
  from fastapi import FastAPI, HTTPException
768ad710   tangwang   MySQL到ES字段映射说明-业务...
11
  from fastapi.middleware.cors import CORSMiddleware
0fd2f875   tangwang   translate
12
13
  from fastapi.responses import JSONResponse
  from pydantic import BaseModel, ConfigDict, Field
768ad710   tangwang   MySQL到ES字段映射说明-业务...
14
  
d4cadc13   tangwang   翻译重构
15
  from config.services_config import get_translation_config
5e4dc8e4   tangwang   翻译架构按“一个翻译服务 +
16
  from translation.service import TranslationService
0fd2f875   tangwang   translate
17
18
19
20
21
  from translation.settings import (
      get_enabled_translation_models,
      normalize_translation_model,
      normalize_translation_scene,
  )
768ad710   tangwang   MySQL到ES字段映射说明-业务...
22
23
24
25
26
27
28
29
  
  # Configure logging.
  # Runs at import time: sets up root logging at INFO level with a
  # "timestamp - logger name - level - message" line format, then creates the
  # module-level logger used by the rest of this file.
  logging.basicConfig(
      level=logging.INFO,
      format='%(asctime)s - %(name)s - %(levelname)s - %(message)s'
  )
  logger = logging.getLogger(__name__)
  
768ad710   tangwang   MySQL到ES字段映射说明-业务...
30
  
0fd2f875   tangwang   translate
31
  @lru_cache(maxsize=1)
  def get_translation_service() -> TranslationService:
      """Return the cached TranslationService, building it on the first call.

      The function takes no arguments, so ``lru_cache(maxsize=1)`` memoizes a
      single instance built from ``get_translation_config()``; later calls
      return that same object.
      """
      translation_config = get_translation_config()
      return TranslationService(translation_config)
768ad710   tangwang   MySQL到ES字段映射说明-业务...
34
35
36
37
38
  
  
  # Request/Response models
  class TranslationRequest(BaseModel):
      """Translation request model."""

      # Example payload attached to the generated JSON schema.
      model_config = ConfigDict(
          json_schema_extra={
              "example": {
                  "text": "商品名称",
                  "target_lang": "en",
                  "source_lang": "zh",
                  "model": "llm",
                  "scene": "sku_name",
              }
          }
      )

      # Required: a single string or a list of strings.
      text: Union[str, List[str]] = Field(
          ...,
          description="Text to translate (string or list of strings)",
      )
      # Required: language to translate into.
      target_lang: str = Field(
          ...,
          description="Target language code (zh, en, ru, etc.)",
      )
      # Optional: defaults to None when the caller does not supply it.
      source_lang: Optional[str] = Field(
          None,
          description="Source language code (optional, auto-detect if not provided)",
      )
      # Optional: defaults to None when the caller does not supply it.
      model: Optional[str] = Field(
          None,
          description="Enabled translation capability name",
      )
      # Optional: defaults to None when the caller does not supply it.
      scene: Optional[str] = Field(
          None,
          description="Translation scene, paired with model routing",
      )
768ad710   tangwang   MySQL到ES字段映射说明-业务...
57
58
59
60
  
  
  class TranslationResponse(BaseModel):
      """Translation response model."""

      # Echo of the request inputs.
      text: Union[str, List[str]] = Field(
          ...,
          description="Original text (string or list)",
      )
      target_lang: str = Field(
          ...,
          description="Target language code",
      )
      source_lang: Optional[str] = Field(
          None,
          description="Source language code (detected or provided)",
      )

      # Translation output; a list may carry None entries for failed items.
      translated_text: Union[str, List[Optional[str]]] = Field(
          ...,
          description="Translated text (string or list; list elements may be null on failure)",
      )

      # Outcome metadata.
      status: str = Field(
          ...,
          description="Translation status",
      )
      model: str = Field(
          ...,
          description="Translation model used",
      )
      scene: str = Field(
          ...,
          description="Translation scene used",
      )
768ad710   tangwang   MySQL到ES字段映射说明-业务...
71
72
  
  
0fd2f875   tangwang   translate
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
  def _normalize_scene(service: TranslationService, scene: Optional[str]) -> str:
      """Resolve ``scene`` through ``normalize_translation_scene`` using the service config."""
      service_config = service.config
      return normalize_translation_scene(service_config, scene)
  
  
  def _normalize_model(service: TranslationService, model: Optional[str]) -> str:
      """Resolve the model name, using the configured default when none is given.

      A falsy ``model`` (``None`` or an empty string) is replaced by
      ``service.config["default_model"]`` before being passed to
      ``normalize_translation_model``.
      """
      requested = model if model else service.config["default_model"]
      return normalize_translation_model(service.config, requested)
  
  
  def _ensure_valid_text(text: Union[str, List[str]]) -> None:
      if isinstance(text, list):
          if not text:
              raise HTTPException(status_code=400, detail="Text list cannot be empty")
          return
      if not text or not text.strip():
          raise HTTPException(status_code=400, detail="Text cannot be empty")
  
  
  def _normalize_batch_result(
      original: List[str],
      translated: Union[str, List[Optional[str]], None],
  ) -> List[Optional[str]]:
      if translated is None:
          return [None for _ in original]
      if not isinstance(translated, list):
          raise HTTPException(status_code=500, detail="Batch translation provider returned non-list result")
      return [translated[idx] if idx < len(translated) else None for idx, _ in enumerate(original)]
  
  
  def _translate_batch(
      service: TranslationService,
      raw_text: List[str],
      *,
      target_lang: str,
      source_lang: Optional[str],
      model: str,
      scene: str,
  ) -> List[Optional[str]]:
      backend = service.get_backend(model)
      if getattr(backend, "supports_batch", False):
          try:
              translated = service.translate(
                  text=raw_text,
                  target_lang=target_lang,
                  source_lang=source_lang,
                  model=model,
                  scene=scene,
              )
              return _normalize_batch_result(raw_text, translated)
          except ValueError:
              raise
          except Exception as exc:
              logger.error("Batch translation failed: %s", exc, exc_info=True)
  
      results: List[Optional[str]] = []
      for item in raw_text:
          if item is None or not str(item).strip():
              results.append(item)  # type: ignore[arg-type]
              continue
          try:
              out = service.translate(
                  text=str(item),
                  target_lang=target_lang,
                  source_lang=source_lang,
                  model=model,
                  scene=scene,
              )
          except ValueError:
              raise
          except Exception as exc:
              logger.warning("Per-item translation failed: %s", exc, exc_info=True)
              out = None
          results.append(out)
      return results
  
  
  @asynccontextmanager
  async def lifespan(_: FastAPI):
      """Fetch the default backend at application startup and log readiness.

      Everything before ``yield`` runs when the app starts: the shared
      translation service is obtained, its default model's backend is
      requested (presumably so it is loaded before the first request; confirm
      against ``TranslationService.get_backend``), and two INFO lines are
      written. Nothing runs after ``yield``.
      """
      logger.info("Starting Translation Service API")

      service = get_translation_service()
      default_model = service.config["default_model"]
      warmed_backend = service.get_backend(default_model)

      logger.info(
          "Translation service ready | default_model=%s available_models=%s loaded_models=%s",
          default_model,
          service.available_models,
          service.loaded_models,
      )

      # Prefer the backend's own model label; fall back to the configured name.
      backend_label = getattr(warmed_backend, "model", default_model)
      logger.info("Default translation backend warmed up | model=%s", backend_label)

      yield
  
  
768ad710   tangwang   MySQL到ES字段映射说明-业务...
167
168
169
  # Create the FastAPI application. The interactive docs are served at /docs
  # and /redoc, and `lifespan` runs the startup logic defined above.
  app = FastAPI(
      lifespan=lifespan,
      title="Translation Service API",
      version="1.0.0",
      description="Translation service with pluggable capabilities and scene routing",
      docs_url="/docs",
      redoc_url="/redoc",
  )
  
  # Add CORS middleware
  # NOTE(review): every origin, method and header is allowed while
  # allow_credentials=True. FastAPI's CORS documentation advises against
  # combining wildcards with credentialed requests. Confirm this is intended,
  # or restrict allow_origins to the known front-end origins.
  app.add_middleware(
      CORSMiddleware,
      allow_origins=["*"],
      allow_credentials=True,
      allow_methods=["*"],
      allow_headers=["*"],
  )
  
  
768ad710   tangwang   MySQL到ES字段映射说明-业务...
187
188
189
190
  @app.get("/health")
  async def health_check():
      """Health check endpoint."""
      # Reports the service's configured defaults and model inventory. Any
      # exception while gathering them produces a 503 response carrying the
      # error text instead of propagating.
      try:
          service = get_translation_service()
          config = service.config
          report = {
              "status": "healthy",
              "service": "translation",
              "default_model": config["default_model"],
              "default_scene": config["default_scene"],
              "available_models": service.available_models,
              "enabled_capabilities": get_enabled_translation_models(config),
              "loaded_models": service.loaded_models,
          }
      except Exception as e:
          logger.error(f"Health check failed: {e}")
          failure = {
              "status": "unhealthy",
              "error": str(e)
          }
          return JSONResponse(status_code=503, content=failure)
      return report
  
  
  @app.post("/translate", response_model=TranslationResponse)
  async def translate(request: TranslationRequest):
      # Handler for POST /translate.
      #
      # Documented with comments rather than a docstring on purpose: FastAPI
      # publishes a handler's docstring as the operation description in the
      # OpenAPI schema, and this edit leaves that output untouched.
      #
      # Flow:
      #   1. Reject empty text or a missing target language with HTTP 400.
      #   2. Resolve scene and model (request values or configured defaults)
      #      and look up the backend for the resolved model.
      #   3. A list input goes through _translate_batch; a single string goes
      #      through service.translate, where a None result is an HTTP 500.
      #   4. Return the inputs, the translation(s), and the model/scene used.
      #
      # Error mapping:
      #   HTTPException -> re-raised unchanged
      #   ValueError    -> HTTP 400 with the error text
      #   anything else -> logged with traceback, HTTP 500
      _ensure_valid_text(request.text)

      if not request.target_lang:
          raise HTTPException(status_code=400, detail="target_lang is required")

      try:
          service = get_translation_service()
          scene = _normalize_scene(service, request.scene)
          model = _normalize_model(service, request.model)
          translator = service.get_backend(model)
          raw_text = request.text

          if isinstance(raw_text, list):
              translated = _translate_batch(
                  service,
                  raw_text,
                  target_lang=request.target_lang,
                  source_lang=request.source_lang,
                  model=model,
                  scene=scene,
              )
          else:
              translated = service.translate(
                  text=raw_text,
                  target_lang=request.target_lang,
                  source_lang=request.source_lang,
                  model=model,
                  scene=scene,
              )
              if translated is None:
                  raise HTTPException(status_code=500, detail="Translation failed")

          # Both paths share one response shape; report the backend's own
          # model label when it has one, otherwise the resolved model name.
          return TranslationResponse(
              text=raw_text,
              target_lang=request.target_lang,
              source_lang=request.source_lang,
              translated_text=translated,
              status="success",
              model=str(getattr(translator, "model", model)),
              scene=scene,
          )

      except HTTPException:
          raise
      except ValueError as e:
          raise HTTPException(status_code=400, detail=str(e)) from e
      except Exception as e:
          # Lazy %-style logging; chain the cause the same way the ValueError
          # branch does so the original traceback stays attached.
          logger.error("Translation error: %s", e, exc_info=True)
          raise HTTPException(status_code=500, detail=f"Translation error: {e}") from e
768ad710   tangwang   MySQL到ES字段映射说明-业务...
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
  
  
  @app.get("/")
  async def root():
      """Root endpoint with API information."""
      # Static descriptor: service identity plus the routes clients can call.
      endpoints = {
          "translate": "POST /translate",
          "health": "GET /health",
          "docs": "GET /docs"
      }
      info = {
          "service": "Translation Service API",
          "version": "1.0.0",
          "status": "running",
          "endpoints": endpoints,
      }
      return info
  
  
  if __name__ == "__main__":
      # Script entry point: read bind options from the command line and start
      # uvicorn with the app referenced by its import string.
      cli = argparse.ArgumentParser(description='Start translation API service')
      cli.add_argument('--host', default='0.0.0.0', help='Host to bind to')
      cli.add_argument('--port', type=int, default=6006, help='Port to bind to')
      cli.add_argument('--reload', action='store_true', help='Enable auto-reload')
      options = cli.parse_args()

      server_options = {
          "host": options.host,
          "port": options.port,
          "reload": options.reload,
      }
      uvicorn.run("api.translator_app:app", **server_options)