115047ee
tangwang
为一个租户灌入测试数据;实例的启动...
|
1
2
|
#!/usr/bin/env python3
"""
|
a7920e17
tangwang
项目名称和部署路径修改
|
3
|
Simple HTTP server for saas-search frontend.
|
115047ee
tangwang
为一个租户灌入测试数据;实例的启动...
|
4
5
6
7
8
9
|
"""
import http.server
import socketserver
import os
import sys
|
bb3c5ef8
tangwang
灌入数据流程跑通
|
10
11
|
import logging
import time
|
02c40701
tangwang
frontend proxy se...
|
12
13
|
import urllib.request
import urllib.error
|
bb3c5ef8
tangwang
灌入数据流程跑通
|
14
|
from collections import defaultdict, deque
|
362d43b6
tangwang
店匠体系数据的搜索
|
15
16
17
18
19
20
21
|
from pathlib import Path
from dotenv import load_dotenv
# Load .env file
project_root = Path(__file__).parent.parent
load_dotenv(project_root / '.env')
|
bb6420d3
tangwang
前端同源代理后端,避免写死6002...
|
22
23
24
25
|
# Get API_BASE_URL from environment(默认不注入,避免被旧 .env 覆盖同源策略)
# 仅当显式设置 FRONTEND_INJECT_API_BASE_URL=1 时才注入 window.API_BASE_URL。
API_BASE_URL = os.getenv('API_BASE_URL') or None
INJECT_API_BASE_URL = os.getenv('FRONTEND_INJECT_API_BASE_URL', '0') == '1'
|
02c40701
tangwang
frontend proxy se...
|
26
27
|
# Backend proxy target for same-origin API forwarding
BACKEND_PROXY_URL = os.getenv('BACKEND_PROXY_URL', 'http://127.0.0.1:6002').rstrip('/')
|
115047ee
tangwang
为一个租户灌入测试数据;实例的启动...
|
28
29
30
31
32
|
# Change to frontend directory
frontend_dir = os.path.join(os.path.dirname(__file__), '../frontend')
os.chdir(frontend_dir)
|
1852e3e3
tangwang
添加Base配置演示流程和数据库配置
|
33
|
# Get port from environment variable or default
|
bb6420d3
tangwang
前端同源代理后端,避免写死6002...
|
34
|
PORT = int(os.getenv('PORT', 6003))
|
115047ee
tangwang
为一个租户灌入测试数据;实例的启动...
|
35
|
|
bb3c5ef8
tangwang
灌入数据流程跑通
|
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
|
# Configure logging to suppress scanner noise
logging.basicConfig(level=logging.ERROR, format='%(asctime)s - %(levelname)s - %(message)s')
class RateLimitingMixin:
"""Mixin for rate limiting requests by IP address."""
request_counts = defaultdict(deque)
rate_limit = 100 # requests per minute
window = 60 # seconds
@classmethod
def is_rate_limited(cls, ip):
now = time.time()
# Clean old requests
while cls.request_counts[ip] and cls.request_counts[ip][0] < now - cls.window:
cls.request_counts[ip].popleft()
# Check rate limit
if len(cls.request_counts[ip]) > cls.rate_limit:
return True
cls.request_counts[ip].append(now)
return False
class MyHTTPRequestHandler(http.server.SimpleHTTPRequestHandler, RateLimitingMixin):
"""Custom request handler with CORS support and robust error handling."""
|
02c40701
tangwang
frontend proxy se...
|
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
|
def _is_proxy_path(self, path: str) -> bool:
"""Return True for API paths that should be forwarded to backend service."""
return path.startswith('/search/') or path.startswith('/admin/') or path.startswith('/indexer/')
def _proxy_to_backend(self):
"""Proxy current request to backend service on the GPU server."""
target_url = f"{BACKEND_PROXY_URL}{self.path}"
method = self.command.upper()
try:
content_length = int(self.headers.get('Content-Length', '0'))
except ValueError:
content_length = 0
body = self.rfile.read(content_length) if content_length > 0 else None
forward_headers = {}
for key, value in self.headers.items():
lk = key.lower()
if lk in ('host', 'content-length', 'connection'):
continue
forward_headers[key] = value
req = urllib.request.Request(
target_url,
data=body,
headers=forward_headers,
method=method,
)
try:
with urllib.request.urlopen(req, timeout=30) as resp:
resp_body = resp.read()
self.send_response(resp.getcode())
for header, value in resp.getheaders():
lh = header.lower()
if lh in ('transfer-encoding', 'connection', 'content-length'):
continue
self.send_header(header, value)
self.end_headers()
self.wfile.write(resp_body)
except urllib.error.HTTPError as e:
err_body = e.read() if hasattr(e, 'read') else b''
self.send_response(e.code)
if e.headers:
for header, value in e.headers.items():
lh = header.lower()
if lh in ('transfer-encoding', 'connection', 'content-length'):
continue
self.send_header(header, value)
self.end_headers()
if err_body:
self.wfile.write(err_body)
except Exception as e:
logging.error(f"Backend proxy error for {method} {self.path}: {e}")
self.send_response(502)
self.send_header('Content-Type', 'application/json; charset=utf-8')
self.end_headers()
self.wfile.write(b'{"error":"Bad Gateway: backend proxy failed"}')
|
1852e3e3
tangwang
添加Base配置演示流程和数据库配置
|
122
|
def do_GET(self):
|
bb6420d3
tangwang
前端同源代理后端,避免写死6002...
|
123
|
"""Handle GET requests with API config injection."""
|
362d43b6
tangwang
店匠体系数据的搜索
|
124
|
path = self.path.split('?')[0]
|
02c40701
tangwang
frontend proxy se...
|
125
126
127
128
129
|
# Proxy API paths to backend first
if self._is_proxy_path(path):
self._proxy_to_backend()
return
|
bb6420d3
tangwang
前端同源代理后端,避免写死6002...
|
130
|
|
362d43b6
tangwang
店匠体系数据的搜索
|
131
132
|
# Route / to index.html
if path == '/' or path == '':
|
4d824a77
tangwang
所有租户共用一套统一配置.tena...
|
133
|
self.path = '/index.html' + (self.path.split('?', 1)[1] if '?' in self.path else '')
|
bb6420d3
tangwang
前端同源代理后端,避免写死6002...
|
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
|
# Inject API config for HTML files
if self.path.endswith('.html'):
self._serve_html_with_config()
else:
super().do_GET()
def _serve_html_with_config(self):
"""Serve HTML with optional API_BASE_URL injected."""
try:
file_path = self.path.lstrip('/')
if not os.path.exists(file_path):
self.send_error(404)
return
with open(file_path, 'r', encoding='utf-8') as f:
html = f.read()
# 默认不注入 API_BASE_URL,避免历史 .env(如 http://xx:6002)覆盖同源调用。
# 仅当 FRONTEND_INJECT_API_BASE_URL=1 且 API_BASE_URL 有值时才注入。
if INJECT_API_BASE_URL and API_BASE_URL:
config_script = f'<script>window.API_BASE_URL="{API_BASE_URL}";</script>\n '
html = html.replace('<script src="/static/js/app.js', config_script + '<script src="/static/js/app.js', 1)
self.send_response(200)
self.send_header('Content-Type', 'text/html; charset=utf-8')
self.end_headers()
self.wfile.write(html.encode('utf-8'))
except Exception as e:
logging.error(f"Error serving HTML: {e}")
self.send_error(500)
|
02c40701
tangwang
frontend proxy se...
|
165
166
167
168
169
170
171
172
|
def do_POST(self):
"""Handle POST requests. Proxy API requests to backend."""
path = self.path.split('?')[0]
if self._is_proxy_path(path):
self._proxy_to_backend()
return
self.send_error(405, "Method Not Allowed")
|
1852e3e3
tangwang
添加Base配置演示流程和数据库配置
|
173
|
|
bb3c5ef8
tangwang
灌入数据流程跑通
|
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
|
def setup(self):
"""Setup with error handling."""
try:
super().setup()
except Exception:
pass # Silently handle setup errors from scanners
def handle_one_request(self):
"""Handle single request with error catching."""
try:
# Check rate limiting
client_ip = self.client_address[0]
if self.is_rate_limited(client_ip):
logging.warning(f"Rate limiting IP: {client_ip}")
self.send_error(429, "Too Many Requests")
return
super().handle_one_request()
except (ConnectionResetError, BrokenPipeError):
# Client disconnected prematurely - common with scanners
pass
except UnicodeDecodeError:
# Binary data received - not HTTP
pass
except Exception as e:
# Log unexpected errors but don't crash
logging.debug(f"Request handling error: {e}")
def log_message(self, format, *args):
"""Suppress logging for malformed requests from scanners."""
message = format % args
# Filter out scanner noise
noise_patterns = [
"code 400",
"Bad request",
"Bad request version",
"Bad HTTP/0.9 request type",
"Bad request syntax"
]
if any(pattern in message for pattern in noise_patterns):
return
# Only log legitimate requests
if message and not message.startswith(" ") and len(message) > 10:
super().log_message(format, *args)
|
115047ee
tangwang
为一个租户灌入测试数据;实例的启动...
|
218
219
220
221
222
223
|
def end_headers(self):
# Add CORS headers
self.send_header('Access-Control-Allow-Origin', '*')
self.send_header('Access-Control-Allow-Methods', 'GET, POST, OPTIONS')
self.send_header('Access-Control-Allow-Headers', 'Content-Type')
|
bb3c5ef8
tangwang
灌入数据流程跑通
|
224
225
226
227
|
# Add security headers
self.send_header('X-Content-Type-Options', 'nosniff')
self.send_header('X-Frame-Options', 'DENY')
self.send_header('X-XSS-Protection', '1; mode=block')
|
115047ee
tangwang
为一个租户灌入测试数据;实例的启动...
|
228
229
230
|
super().end_headers()
def do_OPTIONS(self):
|
bb3c5ef8
tangwang
灌入数据流程跑通
|
231
232
|
"""Handle OPTIONS requests."""
try:
|
02c40701
tangwang
frontend proxy se...
|
233
234
235
236
237
|
path = self.path.split('?')[0]
if self._is_proxy_path(path):
self.send_response(204)
self.end_headers()
return
|
bb3c5ef8
tangwang
灌入数据流程跑通
|
238
239
240
241
242
243
244
245
246
|
self.send_response(200)
self.end_headers()
except Exception:
pass
class ThreadedTCPServer(socketserver.ThreadingMixIn, socketserver.TCPServer):
"""Threaded TCP server with better error handling."""
allow_reuse_address = True
daemon_threads = True
|
115047ee
tangwang
为一个租户灌入测试数据;实例的启动...
|
247
248
|
if __name__ == '__main__':
|
4d824a77
tangwang
所有租户共用一套统一配置.tena...
|
249
250
251
252
253
254
255
256
257
258
259
260
|
# Check if port is already in use
import socket
sock = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
try:
sock.bind(("", PORT))
sock.close()
except OSError:
print(f"ERROR: Port {PORT} is already in use.")
print(f"Please stop the existing server or use a different port.")
print(f"To stop existing server: kill $(lsof -t -i:{PORT})")
sys.exit(1)
|
bb3c5ef8
tangwang
灌入数据流程跑通
|
261
262
|
# Create threaded server for better concurrency
with ThreadedTCPServer(("", PORT), MyHTTPRequestHandler) as httpd:
|
115047ee
tangwang
为一个租户灌入测试数据;实例的启动...
|
263
264
265
|
print(f"Frontend server started at http://localhost:{PORT}")
print(f"Serving files from: {os.getcwd()}")
print("\nPress Ctrl+C to stop the server")
|
bb3c5ef8
tangwang
灌入数据流程跑通
|
266
|
|
115047ee
tangwang
为一个租户灌入测试数据;实例的启动...
|
267
268
269
|
try:
httpd.serve_forever()
except KeyboardInterrupt:
|
bb3c5ef8
tangwang
灌入数据流程跑通
|
270
271
272
|
print("\nShutting down server...")
httpd.shutdown()
print("Server stopped")
|
115047ee
tangwang
为一个租户灌入测试数据;实例的启动...
|
273
|
sys.exit(0)
|
bb3c5ef8
tangwang
灌入数据流程跑通
|
274
275
276
|
except Exception as e:
print(f"Server error: {e}")
sys.exit(1)
|