sycommon-python-lib 0.1.55b1__py3-none-any.whl → 0.1.56__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (48)
  1. sycommon/config/Config.py +29 -4
  2. sycommon/config/LangfuseConfig.py +15 -0
  3. sycommon/config/RerankerConfig.py +1 -0
  4. sycommon/config/SentryConfig.py +13 -0
  5. sycommon/llm/__init__.py +0 -0
  6. sycommon/llm/embedding.py +204 -0
  7. sycommon/llm/get_llm.py +37 -0
  8. sycommon/llm/llm_logger.py +126 -0
  9. sycommon/llm/llm_tokens.py +119 -0
  10. sycommon/llm/struct_token.py +192 -0
  11. sycommon/llm/sy_langfuse.py +103 -0
  12. sycommon/llm/usage_token.py +117 -0
  13. sycommon/logging/kafka_log.py +200 -434
  14. sycommon/logging/logger_levels.py +23 -0
  15. sycommon/middleware/context.py +2 -0
  16. sycommon/middleware/exception.py +10 -16
  17. sycommon/middleware/timeout.py +2 -1
  18. sycommon/middleware/traceid.py +174 -48
  19. sycommon/notice/__init__.py +0 -0
  20. sycommon/notice/uvicorn_monitor.py +200 -0
  21. sycommon/rabbitmq/rabbitmq_client.py +232 -242
  22. sycommon/rabbitmq/rabbitmq_pool.py +278 -218
  23. sycommon/rabbitmq/rabbitmq_service.py +25 -843
  24. sycommon/rabbitmq/rabbitmq_service_client_manager.py +206 -0
  25. sycommon/rabbitmq/rabbitmq_service_connection_monitor.py +73 -0
  26. sycommon/rabbitmq/rabbitmq_service_consumer_manager.py +285 -0
  27. sycommon/rabbitmq/rabbitmq_service_core.py +117 -0
  28. sycommon/rabbitmq/rabbitmq_service_producer_manager.py +238 -0
  29. sycommon/sentry/__init__.py +0 -0
  30. sycommon/sentry/sy_sentry.py +35 -0
  31. sycommon/services.py +124 -96
  32. sycommon/synacos/feign.py +8 -3
  33. sycommon/synacos/feign_client.py +22 -8
  34. sycommon/synacos/nacos_client_base.py +119 -0
  35. sycommon/synacos/nacos_config_manager.py +107 -0
  36. sycommon/synacos/nacos_heartbeat_manager.py +144 -0
  37. sycommon/synacos/nacos_service.py +64 -771
  38. sycommon/synacos/nacos_service_discovery.py +157 -0
  39. sycommon/synacos/nacos_service_registration.py +270 -0
  40. sycommon/tools/env.py +62 -0
  41. sycommon/tools/merge_headers.py +117 -0
  42. sycommon/tools/snowflake.py +101 -153
  43. {sycommon_python_lib-0.1.55b1.dist-info → sycommon_python_lib-0.1.56.dist-info}/METADATA +11 -5
  44. sycommon_python_lib-0.1.56.dist-info/RECORD +89 -0
  45. sycommon_python_lib-0.1.55b1.dist-info/RECORD +0 -62
  46. {sycommon_python_lib-0.1.55b1.dist-info → sycommon_python_lib-0.1.56.dist-info}/WHEEL +0 -0
  47. {sycommon_python_lib-0.1.55b1.dist-info → sycommon_python_lib-0.1.56.dist-info}/entry_points.txt +0 -0
  48. {sycommon_python_lib-0.1.55b1.dist-info → sycommon_python_lib-0.1.56.dist-info}/top_level.txt +0 -0
@@ -1,21 +1,19 @@
1
- import logging
2
1
  import threading
3
- import json
4
- from typing import Callable, Dict, List, Optional
5
- import nacos
6
2
  import socket
7
3
  import signal
8
4
  import sys
9
5
  import os
10
- import yaml
11
6
  import time
12
- import atexit
13
- import random
14
-
15
- from sycommon.config.Config import SingletonMeta
7
+ from typing import Callable, Dict, List, Optional
8
+ from sycommon.config.Config import Config, SingletonMeta
16
9
  from sycommon.logging.kafka_log import SYLogger
17
10
 
18
- logging.getLogger("nacos.client").setLevel(logging.WARNING)
11
+ from sycommon.synacos.nacos_client_base import NacosClientBase
12
+ from sycommon.synacos.nacos_service_registration import NacosServiceRegistration
13
+ from sycommon.synacos.nacos_heartbeat_manager import NacosHeartbeatManager
14
+ from sycommon.synacos.nacos_config_manager import NacosConfigManager
15
+ from sycommon.synacos.nacos_service_discovery import NacosServiceDiscovery
16
+ from sycommon.tools.env import check_env_flag, get_env_var
19
17
 
20
18
 
21
19
  class NacosService(metaclass=SingletonMeta):
@@ -26,408 +24,65 @@ class NacosService(metaclass=SingletonMeta):
26
24
  self.service_name = config['Name']
27
25
  self.host = config['Host']
28
26
  self.port = config['Port']
29
- self.version = os.getenv('VERSION')
30
- self.enable_register_nacos = os.getenv(
31
- 'REGISTER-NACOS', 'true').lower() == 'true'
32
- self.registered = False
33
- self._client_initialized = False # 客户端初始化状态
34
- self._shutdown_event = threading.Event()
35
-
36
- # 添加可重入锁用于状态同步
37
- self._state_lock = threading.RLock()
38
-
39
- # 配置参数
40
- self.max_retries = self.nacos_config.get('maxRetries', 5)
41
- self.retry_delay = self.nacos_config.get('retryDelay', 5)
42
- self.max_retry_delay = self.nacos_config.get('maxRetryDelay', 30)
43
- # 心跳间隔:优先从配置读取,默认15秒(可通过配置修改)
44
- self.heartbeat_interval = self.nacos_config.get(
45
- 'heartbeatInterval', 15)
46
- # 心跳超时:固定设置为10秒(需求指定)
47
- self.heartbeat_timeout = 15
48
- self.register_retry_interval = self.nacos_config.get(
49
- 'registerRetryInterval', 15) # 注册重试间隔
50
-
51
- # 长期重试配置
52
- self.long_term_retry_delay = self.nacos_config.get(
53
- 'longTermRetryDelay', 30)
54
- self.max_long_term_retries = self.nacos_config.get(
55
- 'maxLongTermRetries', -1) # -1表示无限重试
27
+ self.version = get_env_var('VERSION')
28
+ self.enable_register_nacos = check_env_flag(
29
+ ['REGISTER-NACOS'], 'true')
56
30
 
57
- # 注册验证配置:优化默认值(增加次数+延长间隔)
58
- self.registration_verify_count = self.nacos_config.get(
59
- 'registrationVerifyCount', 1) # 验证次数
60
- self.registration_verify_interval = self.nacos_config.get(
61
- 'registrationVerifyInterval', 1) # 验证间隔
62
- self.registration_post_delay = self.nacos_config.get(
63
- 'registrationPostDelay', 3) # 注册后延迟3秒再开始验证
31
+ # 初始化基础模块
32
+ self.client_base = NacosClientBase(
33
+ self.nacos_config, self.enable_register_nacos)
64
34
 
35
+ # 获取真实IP
65
36
  self.real_ip = self.get_service_ip(self.host)
66
- self._long_term_retry_count = 0 # 长期重试计数器
67
37
 
68
- # 轮询索引,用于在所有实例中进行轮询选择
69
- self._round_robin_index = 0
70
- self._round_robin_lock = threading.Lock() # 保护轮询索引的线程安全
38
+ # 初始化各功能模块
39
+ self.registration = NacosServiceRegistration(
40
+ self.client_base, self.service_name, self.real_ip, self.port, self.version
41
+ )
42
+ self.config_manager = NacosConfigManager(self.client_base)
43
+ self.discovery = NacosServiceDiscovery(self.client_base)
44
+
45
+ # 心跳间隔配置
46
+ self.heartbeat_interval = self.nacos_config.get(
47
+ 'heartbeatInterval', 15)
48
+ self.heartbeat_manager = NacosHeartbeatManager(
49
+ self.client_base, self.registration, self.heartbeat_interval
50
+ )
71
51
 
72
52
  if self.enable_register_nacos:
73
- # 初始化客户端(仅在首次调用时执行)
74
- self._initialize_client()
75
- # 启动时清理残留实例
76
- self._cleanup_stale_instance()
53
+ # 初始化客户端
54
+ self.client_base._initialize_client()
55
+ # 清理残留实例
56
+ self.registration._cleanup_stale_instance()
77
57
  else:
78
58
  SYLogger.info("nacos:本地开发模式,不初始化Nacos客户端")
79
59
 
80
- self.share_configs = self.read_configs()
81
-
82
- # 配置监听器
83
- self._config_listeners = {}
84
- self._config_cache = {}
85
-
86
- # 心跳相关
87
- self._last_heartbeat_time = 0
88
- self._heartbeat_fail_count = 0
89
- self._heartbeat_lock = threading.Lock()
90
- self._heartbeat_thread = None
91
-
92
- self.max_heartbeat_timeout = self.nacos_config.get(
93
- 'maxHeartbeatTimeout', 30)
94
- self._last_successful_heartbeat = time.time()
95
- # 连接监控检查间隔(新增配置,默认30秒,避免硬编码)
96
- self.connection_check_interval = self.nacos_config.get(
97
- 'connectionCheckInterval', 30)
98
- # 配置监视线程检查间隔(默认30秒)
99
- self.config_watch_interval = self.nacos_config.get(
100
- 'configWatchInterval', 30)
60
+ # 读取配置并设置到全局配置
61
+ self.share_configs = self.config_manager.read_configs(
62
+ self.nacos_config.get('sharedConfigs', []))
63
+ Config().set_attr(self.share_configs)
101
64
 
102
65
  # 启动配置监视线程
103
- self._watch_thread = threading.Thread(
104
- target=self._watch_configs, daemon=True)
105
- self._watch_thread.start()
66
+ self.config_manager.start_watch_configs()
106
67
 
107
- # 仅在需要注册时启动心跳和监控线程
68
+ # 仅在需要注册时启动心跳
108
69
  if self.enable_register_nacos:
109
- # 启动心跳线程
110
- self.start_heartbeat()
70
+ self.heartbeat_manager.start_heartbeat()
111
71
  else:
112
72
  SYLogger.info("nacos:本地开发模式,不启动心跳和监控线程")
113
73
 
114
- def _initialize_client(self):
115
- """初始化Nacos客户端(仅首次调用时执行)"""
116
- if self._client_initialized:
117
- return True
118
-
119
- for attempt in range(self.max_retries):
120
- try:
121
- register_ip = self.nacos_config['registerIp']
122
- namespace_id = self.nacos_config['namespaceId']
123
- self.nacos_client = nacos.NacosClient(
124
- server_addresses=register_ip,
125
- namespace=namespace_id
126
- )
127
- SYLogger.info("nacos:客户端初始化成功")
128
- self._client_initialized = True
129
- return True
130
- except Exception as e:
131
- delay = min(self.retry_delay, self.max_retry_delay)
132
- SYLogger.error(
133
- f"nacos:客户端初始化失败 (尝试 {attempt+1}/{self.max_retries}): {e}")
134
- time.sleep(delay)
135
-
136
- SYLogger.warning("nacos:无法连接到 Nacos 服务器,已达到最大重试次数")
137
- return False
138
-
139
- def _cleanup_stale_instance(self):
140
- """清理可能存在的残留实例"""
141
- if not self._client_initialized:
142
- return
143
-
144
- try:
145
- self.nacos_client.remove_naming_instance(
146
- service_name=self.service_name,
147
- ip=self.real_ip,
148
- port=int(self.port),
149
- cluster_name="DEFAULT"
150
- )
151
- SYLogger.warning(f"nacos:清理残留实例: {self.real_ip}:{self.port}")
152
- except Exception as e:
153
- SYLogger.error(f"nacos:清理残留实例异常: {e}")
154
-
155
- def ensure_client_connected(self, retry_once=False):
156
- """确保Nacos客户端已连接,返回连接状态"""
157
- # 使用线程锁保护客户端初始化状态
158
- with self._state_lock:
159
- if self._client_initialized:
160
- return True
161
-
162
- SYLogger.warning("nacos:客户端未初始化,尝试连接...")
163
-
164
- # 记录尝试次数,避免无限循环
165
- attempt = 0
166
- max_attempts = 2 if retry_once else self.max_retries
167
-
168
- while attempt < max_attempts:
169
- try:
170
- register_ip = self.nacos_config['registerIp']
171
- namespace_id = self.nacos_config['namespaceId']
172
-
173
- # 创建新的Nacos客户端实例
174
- self.nacos_client = nacos.NacosClient(
175
- server_addresses=register_ip,
176
- namespace=namespace_id
177
- )
178
-
179
- # 验证客户端是否真正可用
180
- connection_valid = self._verify_client_connection()
181
-
182
- if connection_valid:
183
- self._client_initialized = True
184
- SYLogger.info("nacos:客户端初始化成功")
185
-
186
- # 客户端重新连接后,检查服务注册状态
187
- self.registered = self.check_service_registered()
188
- return True
189
- else:
190
- raise ConnectionError("nacos:客户端初始化后无法验证连接")
191
-
192
- except Exception as e:
193
- attempt += 1
194
- delay = min(self.retry_delay, self.max_retry_delay)
195
-
196
- SYLogger.error(
197
- f"nacos:客户端初始化失败 (尝试 {attempt}/{max_attempts}): {e}")
198
- time.sleep(delay)
199
-
200
- SYLogger.error("nacos:无法连接到 Nacos 服务器,已达到最大重试次数")
201
- return False
202
-
203
- def _verify_client_connection(self):
204
- """验证客户端是否真正连接成功"""
205
- # 本地开发模式下直接返回True,不进行实际验证
206
- if not self.enable_register_nacos:
207
- return True
208
-
209
- try:
210
- # 使用当前服务的命名实例查询来验证连接
211
- namespace_id = self.nacos_config['namespaceId']
212
- self.nacos_client.list_naming_instance(
213
- service_name=self.service_name,
214
- namespace_id=namespace_id,
215
- group_name="DEFAULT_GROUP",
216
- healthy_only=True
217
- )
218
- return True
219
- except Exception as e:
220
- SYLogger.warning(f"nacos:客户端连接验证失败: {e}")
221
- return False
222
-
223
- def check_service_registered(self):
224
- """检查服务是否已注册(基于实例列表)"""
225
- # 本地开发模式下直接返回True,模拟已注册状态
226
- if not self.enable_register_nacos:
227
- return True
228
-
229
- if not self.ensure_client_connected():
230
- return False
231
-
232
- try:
233
- namespace_id = self.nacos_config['namespaceId']
234
- instances = self.nacos_client.list_naming_instance(
235
- service_name=self.service_name,
236
- namespace_id=namespace_id,
237
- group_name="DEFAULT_GROUP",
238
- healthy_only=True,
239
- )
240
-
241
- # 检查是否存在包含当前IP和端口的实例
242
- found = False
243
- for instance in instances.get('hosts', []):
244
- if (instance.get('ip') == self.real_ip and
245
- instance.get('port') == int(self.port)):
246
- SYLogger.info(f"nacos:找到已注册实例: {self.real_ip}:{self.port}")
247
- found = True
248
- break
249
-
250
- if not found:
251
- SYLogger.warning(f"nacos:未找到注册实例: {self.real_ip}:{self.port}")
252
-
253
- # 带锁更新注册状态
254
- with self._state_lock:
255
- self.registered = found
256
-
257
- return found
258
- except Exception as e:
259
- SYLogger.error(f"nacos:检查服务注册状态失败: {e}")
260
- return False
261
-
262
- def verify_registration(self):
263
- """多次验证服务是否成功注册"""
264
- success_count = 0
265
- SYLogger.info(
266
- f"nacos:开始验证服务注册状态,共验证 {self.registration_verify_count} 次")
267
-
268
- for i in range(self.registration_verify_count):
269
- if self.check_service_registered():
270
- success_count += 1
271
- else:
272
- SYLogger.warning(f"nacos:第 {i+1} 次验证未找到注册实例")
273
-
274
- if i < self.registration_verify_count - 1:
275
- time.sleep(self.registration_verify_interval)
276
-
277
- if success_count >= self.registration_verify_count / 2:
278
- SYLogger.info(
279
- f"nacos:服务注册验证成功,{success_count}/{self.registration_verify_count} 次验证通过")
280
- return True
281
- else:
282
- SYLogger.error(
283
- f"nacos:服务注册验证失败,仅 {success_count}/{self.registration_verify_count} 次验证通过")
284
- return False
285
-
286
- def register_with_retry(self):
287
- """带重试机制的服务注册(基于实例列表检查)"""
288
- retry_count = 0
289
- last_error = None
290
-
291
- # 带锁重置注册状态
292
- with self._state_lock:
293
- self.registered = False
294
-
295
- while (not self.registered) and (self.max_long_term_retries < 0 or retry_count < self.max_long_term_retries):
296
- # 增加状态检查点,防止重复注册
297
- with self._state_lock:
298
- if self.registered:
299
- return True
300
-
301
- try:
302
- # 尝试注册服务
303
- register_success = self.register(force=True)
304
-
305
- if not register_success:
306
- raise RuntimeError("nacos:服务注册请求失败")
307
-
308
- # 关键优化1:注册请求发送后,延迟一段时间再验证(默认3秒)
309
- SYLogger.info(
310
- f"nacos:服务注册请求已发送,延迟 {self.registration_post_delay} 秒后开始验证(确保Nacos服务器完成实例写入)")
311
- time.sleep(self.registration_post_delay)
312
-
313
- # 关键优化2:多次验证服务是否真正注册成功(默认3次,每次间隔2秒)
314
- registered = self.verify_registration()
315
-
316
- # 带锁更新注册状态
317
- with self._state_lock:
318
- self.registered = registered
319
-
320
- # 再次检查状态,防止其他线程修改
321
- with self._state_lock:
322
- if self.registered:
323
- # 注册成功后,更新客户端状态
324
- self._client_initialized = True
325
-
326
- # 注册成功后,通知心跳线程立即发送心跳
327
- self._shutdown_event.set()
328
- self._shutdown_event.clear()
329
-
330
- # 注册成功后,更新监控线程的状态
331
- self._long_term_retry_count = 0
332
-
333
- SYLogger.info(
334
- f"nacos:服务注册成功并通过验证: {self.service_name}")
335
- return True
336
- else:
337
- raise RuntimeError("nacos:服务注册验证失败")
338
-
339
- except Exception as e:
340
- last_error = str(e)
341
- retry_count += 1
342
- delay = min(self.register_retry_interval, self.max_retry_delay)
343
-
344
- SYLogger.warning(
345
- f"nacos:服务注册尝试 {retry_count} 失败: {last_error},{delay}秒后重试")
346
- time.sleep(delay)
347
-
348
- # 最终检查,防止在最后一次重试后其他线程成功注册
349
- with self._state_lock:
350
- if self.registered:
351
- return True
352
-
353
- # 确实注册失败
354
- if last_error:
355
- SYLogger.error(f"nacos:服务注册失败,最终错误: {last_error}")
356
- else:
357
- SYLogger.error(f"nacos:服务注册失败,已达到最大重试次数: {self.service_name}")
358
-
359
- return False
360
-
361
- def register(self, force=False):
362
- """注册服务到Nacos"""
363
- # 使用状态锁保护注册状态
364
- with self._state_lock:
365
- if self.registered and not force and self.check_service_registered():
366
- return True
367
-
368
- if self.registered and not force:
369
- self.registered = False
370
- SYLogger.warning("nacos:本地状态显示已注册,但Nacos中未找到服务实例,准备重新注册")
371
-
372
- metadata = {
373
- "ignore-metrics": "true",
374
- # "preserved.heart.beat.interval": "3000", # 心跳间隔 3 秒
375
- # "preserved.heart.beat.timeout": "15000", # 心跳超时 15 秒
376
- # "preserved.ip.delete.timeout": "30000" # 实例删除超时 30 秒
377
- }
378
- if self.version:
379
- metadata["version"] = self.version
380
-
381
- for attempt in range(self.max_retries):
382
- if not self.ensure_client_connected():
383
- return False
384
-
385
- try:
386
- # 注册服务
387
- self.nacos_client.add_naming_instance(
388
- service_name=self.service_name,
389
- ip=self.real_ip,
390
- port=int(self.port),
391
- metadata=metadata,
392
- cluster_name="DEFAULT",
393
- healthy=True,
394
- ephemeral=True,
395
- heartbeat_interval=self.heartbeat_interval
396
- )
397
- SYLogger.info(
398
- f"nacos:服务 {self.service_name} 注册请求已发送: {self.real_ip}:{self.port}")
399
-
400
- # 注册退出时的清理函数
401
- if not hasattr(self, '_atexit_registered') or not self._atexit_registered:
402
- atexit.register(self.deregister_service)
403
- self._atexit_registered = True
404
-
405
- return True
406
- except Exception as e:
407
- if "signal only works in main thread" in str(e):
408
- return True
409
- elif attempt < self.max_retries - 1:
410
- SYLogger.warning(
411
- f"nacos:服务注册失败 (尝试 {attempt+1}/{self.max_retries}): {e}")
412
- time.sleep(self.retry_delay)
413
- else:
414
- SYLogger.error(f"nacos:服务注册失败,已达到最大重试次数: {e}")
415
- return False
416
-
417
74
  @staticmethod
418
75
  def setup_nacos(config: dict):
419
- """创建并初始化Nacos管理器"""
76
+ """创建并初始化Nacos管理器(保持原有接口)"""
420
77
  instance = NacosService(config)
421
78
 
422
- # 仅在需要注册时执行注册逻辑
423
79
  if instance.enable_register_nacos:
424
- # 使用带超时的等待机制,而不是单次尝试
425
- timeout = 60 # 60秒超时
80
+ # 启动注册线程
81
+ timeout = 60
426
82
  start_time = time.time()
427
83
 
428
- # 启动注册线程,不阻塞主线程(替换原线程池)
429
84
  register_thread = threading.Thread(
430
- target=instance.register_with_retry,
85
+ target=instance.registration.register_with_retry,
431
86
  daemon=True,
432
87
  name="NacosRegisterThread"
433
88
  )
@@ -435,244 +90,38 @@ class NacosService(metaclass=SingletonMeta):
435
90
 
436
91
  # 等待注册完成或超时
437
92
  while True:
438
- # 带锁检查状态
439
- with instance._state_lock:
440
- if instance.registered:
441
- break
93
+ if instance.registration.registered:
94
+ break
442
95
 
443
96
  if time.time() - start_time >= timeout:
444
- # 超时处理
445
97
  break
446
98
 
447
99
  time.sleep(1)
448
100
 
449
101
  # 最终状态检查
450
- with instance._state_lock:
451
- if not instance.registered:
452
- # 清理并抛出异常
453
- try:
454
- instance.deregister_service()
455
- except Exception as e:
456
- SYLogger.error(f"nacos:服务注册失败后,注销服务时发生错误: {e}")
457
- raise RuntimeError("nacos:服务注册失败,应用启动终止")
102
+ if not instance.registration.registered:
103
+ try:
104
+ instance.registration.deregister_service()
105
+ except Exception as e:
106
+ SYLogger.error(f"nacos:服务注册失败后,注销服务时发生错误: {e}")
107
+ raise RuntimeError("nacos:服务注册失败,应用启动终止")
458
108
 
459
- # 服务注册成功后再注册信号处理
109
+ # 注册信号处理
460
110
  signal.signal(signal.SIGTERM, instance.handle_signal)
461
111
  signal.signal(signal.SIGINT, instance.handle_signal)
462
112
 
463
113
  # 启动连接监控线程
464
- threading.Thread(target=instance.monitor_connection,
465
- daemon=True, name="NacosConnectionMonitorThread").start()
114
+ threading.Thread(target=instance.discovery.monitor_connection,
115
+ args=(instance.registration,),
116
+ daemon=True,
117
+ name="NacosConnectionMonitorThread").start()
466
118
  else:
467
119
  SYLogger.info("nacos:本地开发模式,跳过服务注册流程")
468
120
 
469
121
  return instance
470
122
 
471
- def start_heartbeat(self):
472
- """启动心跳线程(确保单例)"""
473
- with self._heartbeat_lock: # 加锁确保线程安全
474
- # 双重检查:先判断线程是否已存在且存活
475
- if self._heartbeat_thread is not None and self._heartbeat_thread.is_alive():
476
- return
477
-
478
- # 彻底清理可能的残留线程引用
479
- self._heartbeat_thread = None
480
-
481
- # 创建新的心跳线程
482
- self._heartbeat_thread = threading.Thread(
483
- target=self._send_heartbeat_loop,
484
- name="NacosHeartbeatThread",
485
- daemon=True
486
- )
487
- self._heartbeat_thread.daemon = True
488
- self._heartbeat_thread.start()
489
- SYLogger.info(
490
- f"nacos:心跳线程启动,线程ID: {self._heartbeat_thread.ident},"
491
- f"心跳间隔: {self.heartbeat_interval}秒,"
492
- f"心跳超时: {self.heartbeat_timeout}秒"
493
- )
494
-
495
- def _send_heartbeat_loop(self):
496
- """优化后的心跳发送循环,确保严格按间隔执行"""
497
- current_thread = threading.current_thread()
498
- thread_ident = current_thread.ident
499
- SYLogger.info(
500
- f"nacos:心跳循环启动 - 线程ID: {thread_ident}, "
501
- f"配置间隔: {self.heartbeat_interval}秒, "
502
- f"超时时间: {self.heartbeat_timeout}秒"
503
- )
504
-
505
- consecutive_fail = 0 # 连续失败计数器
506
-
507
- while not self._shutdown_event.is_set():
508
- # 记录当前时间,作为本次心跳的基准
509
- current_time = time.time()
510
-
511
- try:
512
- # 检查注册状态(带锁读取)
513
- with self._state_lock:
514
- registered_status = self.registered
515
-
516
- if not registered_status:
517
- SYLogger.warning(
518
- f"nacos:服务未注册,跳过心跳 - 线程ID: {thread_ident}")
519
- consecutive_fail = 0
520
- else:
521
- # 发送心跳(10秒超时)
522
- success = self.send_heartbeat()
523
- if success:
524
- consecutive_fail = 0
525
- self._last_successful_heartbeat = current_time
526
- SYLogger.info(
527
- f"nacos:心跳发送成功 - 时间: {current_time:.3f}, "
528
- f"间隔: {self.heartbeat_interval}秒"
529
- )
530
- else:
531
- consecutive_fail += 1
532
- SYLogger.warning(
533
- f"nacos:心跳发送失败 - 连续失败: {consecutive_fail}次"
534
- )
535
- if consecutive_fail >= 5:
536
- SYLogger.error("nacos:心跳连续失败5次,尝试重连")
537
- self.reconnect_nacos_client()
538
- consecutive_fail = 0
539
-
540
- except Exception as e:
541
- consecutive_fail += 1
542
- SYLogger.error(
543
- f"nacos:心跳异常: {str(e)}, 连续失败: {consecutive_fail}次")
544
-
545
- # 计算下次执行时间(当前时间 + 配置间隔),确保间隔稳定
546
- next_run_time = current_time + self.heartbeat_interval
547
- sleep_time = max(0, next_run_time - time.time()
548
- ) # 避免负数(处理耗时超过间隔的情况)
549
- self._shutdown_event.wait(sleep_time) # 精准休眠至下次执行时间
550
-
551
- SYLogger.info(f"nacos:心跳循环已停止 - 线程ID: {thread_ident}")
552
-
553
- def send_heartbeat(self):
554
- """发送心跳并添加10秒超时控制(替换线程池实现)"""
555
- if not self.ensure_client_connected():
556
- SYLogger.warning("nacos:客户端未连接,心跳发送失败")
557
- return False
558
-
559
- # 用线程+join实现10秒超时控制
560
- result_list = [] # 用于线程间传递结果
561
-
562
- def heartbeat_task():
563
- """心跳实际执行任务"""
564
- try:
565
- result = self._send_heartbeat_internal()
566
- result_list.append(result)
567
- except Exception as e:
568
- SYLogger.error(f"nacos:心跳任务执行异常: {e}")
569
- result_list.append(False)
570
-
571
- # 启动心跳任务线程
572
- task_thread = threading.Thread(
573
- target=heartbeat_task,
574
- daemon=True,
575
- name="NacosHeartbeatTaskThread"
576
- )
577
- task_thread.start()
578
-
579
- # 等待线程完成,最多等待10秒
580
- task_thread.join(timeout=self.heartbeat_timeout)
581
-
582
- # 处理结果
583
- if not result_list:
584
- # 超时未返回
585
- SYLogger.error(f"nacos:心跳发送超时({self.heartbeat_timeout}秒)")
586
- self._client_initialized = False # 强制重连
587
- return False
588
-
589
- # 检查心跳结果
590
- if result_list[0]:
591
- self._last_successful_heartbeat = time.time()
592
- return result_list[0]
593
-
594
- def _send_heartbeat_internal(self):
595
- """实际的心跳发送逻辑"""
596
- result = self.nacos_client.send_heartbeat(
597
- service_name=self.service_name,
598
- ip=self.real_ip,
599
- port=int(self.port),
600
- cluster_name="DEFAULT",
601
- weight=1.0,
602
- metadata={"version": self.version} if self.version else None
603
- )
604
-
605
- # 处理返回结果
606
- if result and isinstance(result, dict) and result.get('lightBeatEnabled', False):
607
- SYLogger.info(f"nacos:心跳发送成功,Nacos返回: {result}")
608
- return True
609
- else:
610
- SYLogger.warning(f"nacos:心跳发送失败,Nacos返回: {result}")
611
- return False
612
-
613
- def reconnect_nacos_client(self):
614
- """重新连接Nacos客户端"""
615
- SYLogger.warning("nacos:尝试重新连接Nacos客户端")
616
- self._client_initialized = False
617
- return self.ensure_client_connected()
618
-
619
- def monitor_connection(self):
620
- """优化的连接监控线程,缩短检查间隔"""
621
- check_interval = self.connection_check_interval
622
- thread_start_time = time.time()
623
- check_counter = 0
624
-
625
- while not self._shutdown_event.is_set():
626
- try:
627
- current_time = time.time()
628
-
629
- SYLogger.info(
630
- f"nacos:连接监控线程运行中,检查间隔: {check_interval}s")
631
-
632
- # 检查客户端连接状态
633
- if not self.ensure_client_connected():
634
- SYLogger.warning("nacos:检测到Nacos客户端连接丢失,尝试重新初始化")
635
- self._initialize_client() # 尝试重新初始化客户端
636
-
637
- # 检查服务注册状态
638
- current_registered = self.check_service_registered()
639
-
640
- # 带锁更新注册状态
641
- with self._state_lock:
642
- if current_registered != self.registered:
643
- if current_registered:
644
- self.registered = True
645
- SYLogger.info(f"nacos:服务实例已重新注册")
646
- else:
647
- self.registered = False
648
- SYLogger.warning(f"nacos:服务实例未注册,尝试重新注册")
649
- # 启动临时线程执行重新注册(替换原线程池)
650
- retry_thread = threading.Thread(
651
- target=self.register_with_retry,
652
- daemon=True,
653
- name="NacosRetryRegisterThread"
654
- )
655
- retry_thread.start()
656
-
657
- # 20%的概率执行深度检查
658
- if random.random() < 0.2:
659
- self.verify_registration()
660
-
661
- # 每小时重置一次内部状态
662
- if current_time - thread_start_time > 3600:
663
- SYLogger.info("nacos:连接监控线程已运行1小时,重置内部状态")
664
- thread_start_time = current_time
665
- check_counter = 0
666
-
667
- check_counter += 1
668
- # 休眠指定时间
669
- self._shutdown_event.wait(check_interval)
670
- except Exception as e:
671
- SYLogger.error(f"nacos:连接监控异常: {e}")
672
- time.sleep(self.retry_delay)
673
-
674
123
  def get_service_ip(self, config_ip):
675
- """获取服务实际IP地址"""
124
+ """获取服务实际IP地址(保持原有逻辑)"""
676
125
  if config_ip in ['127.0.0.1', '0.0.0.0']:
677
126
  try:
678
127
  with socket.socket(socket.AF_INET, socket.SOCK_DGRAM) as s:
@@ -682,177 +131,21 @@ class NacosService(metaclass=SingletonMeta):
682
131
  return '127.0.0.1'
683
132
  return config_ip
684
133
 
685
- def deregister_service(self):
686
- """从Nacos注销服务"""
687
- with self._state_lock:
688
- if not self.registered or not self._client_initialized:
689
- return
690
-
691
- SYLogger.info("nacos:正在注销服务...")
692
- try:
693
- self.nacos_client.remove_naming_instance(
694
- service_name=self.service_name,
695
- ip=self.real_ip,
696
- port=int(self.port),
697
- cluster_name="DEFAULT"
698
- )
699
- with self._state_lock:
700
- self.registered = False
701
- SYLogger.info(f"nacos:服务 {self.service_name} 已注销")
702
- except Exception as e:
703
- SYLogger.error(f"nacos:注销服务时发生错误: {e}")
704
- finally:
705
- self._shutdown_event.set()
706
-
707
134
  def handle_signal(self, signum, frame):
708
- """处理退出信号"""
135
+ """处理退出信号(保持原有逻辑)"""
709
136
  SYLogger.info(f"nacos:收到信号 {signum},正在关闭服务...")
710
- self.deregister_service()
137
+ self.registration.deregister_service()
711
138
  sys.exit(0)
712
139
 
713
- def read_configs(self) -> dict:
714
- """读取共享配置"""
715
- configs = {}
716
- shared_configs = self.nacos_config.get('sharedConfigs', [])
717
-
718
- for config in shared_configs:
719
- data_id = config['dataId']
720
- group = config['group']
721
-
722
- for attempt in range(self.max_retries):
723
- try:
724
- # 检查客户端连接
725
- if not self.ensure_client_connected():
726
- self.reconnect_nacos_client()
727
-
728
- # 获取配置
729
- content = self.nacos_client.get_config(data_id, group)
730
-
731
- try:
732
- configs[data_id] = json.loads(content)
733
- except json.JSONDecodeError:
734
- try:
735
- configs[data_id] = yaml.safe_load(content)
736
- except yaml.YAMLError:
737
- SYLogger.error(f"nacos:无法解析 {data_id} 的内容")
738
- break
739
- except Exception as e:
740
- if attempt < self.max_retries - 1:
741
- SYLogger.warning(
742
- f"nacos:读取配置 {data_id} 失败 (尝试 {attempt+1}/{self.max_retries}): {e}")
743
- time.sleep(self.retry_delay)
744
- else:
745
- SYLogger.error(
746
- f"nacos:读取配置 {data_id} 失败,已达到最大重试次数: {e}")
747
-
748
- return configs
749
-
140
+ # 以下为兼容原有接口的封装方法
750
141
  def add_config_listener(self, data_id: str, callback: Callable[[str], None]):
751
- """添加配置变更监听器"""
752
- self._config_listeners[data_id] = callback
753
- # 初始获取一次配置
754
- if config := self.get_config(data_id):
755
- callback(config)
142
+ return self.config_manager.add_config_listener(data_id, callback)
756
143
 
757
144
  def get_config(self, data_id: str, group: str = "DEFAULT_GROUP") -> Optional[str]:
758
- """获取配置内容"""
759
- if not self.ensure_client_connected():
760
- return None
761
-
762
- try:
763
- return self.nacos_client.get_config(data_id, group=group)
764
- except Exception as e:
765
- SYLogger.error(f"nacos:获取配置 {data_id} 失败: {str(e)}")
766
- return None
767
-
768
- def _watch_configs(self):
769
- """配置监听线程"""
770
- check_interval = self.config_watch_interval
771
-
772
- while not self._shutdown_event.is_set():
773
- try:
774
- for data_id, callback in list(self._config_listeners.items()):
775
- new_config = self.get_config(data_id)
776
- if new_config and new_config != self._config_cache.get(data_id):
777
- # 直接执行回调(替换原线程池,配置回调通常为轻量操作)
778
- callback(new_config)
779
- self._config_cache[data_id] = new_config
780
- except Exception as e:
781
- SYLogger.error(f"nacos:配置监视线程异常: {str(e)}")
782
- self._shutdown_event.wait(check_interval)
145
+ return self.config_manager.get_config(data_id, group)
783
146
 
784
147
  def discover_services(self, service_name: str, group: str = "DEFAULT_GROUP", version: str = None) -> List[Dict]:
785
- """发现服务实例列表 (与Java格式兼容)"""
786
- if not self.ensure_client_connected():
787
- return []
788
-
789
- return self.get_service_instances(service_name, group, version)
148
+ return self.discovery.discover_services(service_name, group, version)
790
149
 
791
150
  def get_service_instances(self, service_name: str, group: str = "DEFAULT_GROUP", target_version: str = None) -> List[Dict]:
792
- """
793
- 获取服务实例列表,并按照以下优先级规则筛选:
794
- 1. 相同版本号的实例
795
- 2. 无版本号的实例
796
- 3. 所有实例中轮询
797
- """
798
- try:
799
- namespace_id = self.nacos_config['namespaceId']
800
- instances = self.nacos_client.list_naming_instance(
801
- service_name,
802
- namespace_id=namespace_id,
803
- group_name=group,
804
- healthy_only=True,
805
- )
806
-
807
- if not instances or 'hosts' not in instances:
808
- SYLogger.info(f"nacos:未发现 {service_name} 的服务实例")
809
- return []
810
-
811
- all_instances = instances.get('hosts', [])
812
- SYLogger.info(
813
- f"nacos:共发现 {len(all_instances)} 个 {service_name} 服务实例")
814
-
815
- # 确定要使用的目标版本,如果未指定则使用当前服务的版本
816
- version_to_use = target_version or self.version
817
-
818
- # 按规则筛选实例
819
- if version_to_use:
820
- # 1. 筛选相同版本号的实例
821
- same_version_instances = [
822
- instance for instance in all_instances
823
- if instance.get('metadata', {}).get('version') == version_to_use
824
- ]
825
-
826
- if same_version_instances:
827
- SYLogger.info(
828
- f"nacos:筛选出 {len(same_version_instances)} 个与当前版本({version_to_use})匹配的实例")
829
- return same_version_instances
830
-
831
- # 2. 如果没有相同版本的实例,筛选无版本号的实例
832
- no_version_instances = [
833
- instance for instance in all_instances
834
- if 'version' not in instance.get('metadata', {})
835
- ]
836
-
837
- if no_version_instances:
838
- SYLogger.info(
839
- f"nacos:未找到相同版本({version_to_use})的实例,筛选出 {len(no_version_instances)} 个无版本号的实例")
840
- return no_version_instances
841
-
842
- # 3. 如果没有指定版本或前两个规则都不满足,使用轮询方式选择所有健康实例
843
- SYLogger.info(
844
- f"nacos:使用轮询方式从 {len(all_instances)} 个实例中选择")
845
-
846
- # 线程安全地获取下一个轮询索引
847
- with self._round_robin_lock:
848
- selected_index = self._round_robin_index % len(all_instances)
849
- # 更新轮询索引,为下一次请求做准备
850
- self._round_robin_index = (
851
- selected_index + 1) % len(all_instances)
852
-
853
- # 返回包含当前选中实例的列表
854
- return [all_instances[selected_index]]
855
-
856
- except Exception as e:
857
- SYLogger.error(f"nacos:服务发现失败: {service_name}: {str(e)}")
858
- return []
151
+ return self.discovery.get_service_instances(service_name, group, target_version)