sycommon-python-lib 0.1.56b5__py3-none-any.whl → 0.1.57b4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (38)
  1. sycommon/config/Config.py +24 -3
  2. sycommon/config/LangfuseConfig.py +15 -0
  3. sycommon/config/SentryConfig.py +13 -0
  4. sycommon/llm/embedding.py +269 -50
  5. sycommon/llm/get_llm.py +9 -218
  6. sycommon/llm/struct_token.py +192 -0
  7. sycommon/llm/sy_langfuse.py +103 -0
  8. sycommon/llm/usage_token.py +117 -0
  9. sycommon/logging/kafka_log.py +187 -433
  10. sycommon/middleware/exception.py +10 -16
  11. sycommon/middleware/timeout.py +2 -1
  12. sycommon/middleware/traceid.py +81 -76
  13. sycommon/notice/uvicorn_monitor.py +32 -27
  14. sycommon/rabbitmq/rabbitmq_client.py +247 -242
  15. sycommon/rabbitmq/rabbitmq_pool.py +201 -123
  16. sycommon/rabbitmq/rabbitmq_service.py +25 -843
  17. sycommon/rabbitmq/rabbitmq_service_client_manager.py +211 -0
  18. sycommon/rabbitmq/rabbitmq_service_connection_monitor.py +73 -0
  19. sycommon/rabbitmq/rabbitmq_service_consumer_manager.py +285 -0
  20. sycommon/rabbitmq/rabbitmq_service_core.py +117 -0
  21. sycommon/rabbitmq/rabbitmq_service_producer_manager.py +238 -0
  22. sycommon/sentry/__init__.py +0 -0
  23. sycommon/sentry/sy_sentry.py +35 -0
  24. sycommon/services.py +122 -96
  25. sycommon/synacos/nacos_client_base.py +121 -0
  26. sycommon/synacos/nacos_config_manager.py +107 -0
  27. sycommon/synacos/nacos_heartbeat_manager.py +144 -0
  28. sycommon/synacos/nacos_service.py +63 -783
  29. sycommon/synacos/nacos_service_discovery.py +157 -0
  30. sycommon/synacos/nacos_service_registration.py +270 -0
  31. sycommon/tools/env.py +62 -0
  32. sycommon/tools/merge_headers.py +20 -0
  33. sycommon/tools/snowflake.py +101 -153
  34. {sycommon_python_lib-0.1.56b5.dist-info → sycommon_python_lib-0.1.57b4.dist-info}/METADATA +10 -8
  35. {sycommon_python_lib-0.1.56b5.dist-info → sycommon_python_lib-0.1.57b4.dist-info}/RECORD +38 -20
  36. {sycommon_python_lib-0.1.56b5.dist-info → sycommon_python_lib-0.1.57b4.dist-info}/WHEEL +0 -0
  37. {sycommon_python_lib-0.1.56b5.dist-info → sycommon_python_lib-0.1.57b4.dist-info}/entry_points.txt +0 -0
  38. {sycommon_python_lib-0.1.56b5.dist-info → sycommon_python_lib-0.1.57b4.dist-info}/top_level.txt +0 -0
@@ -1,19 +1,20 @@
1
1
  import threading
2
- import json
3
- from typing import Callable, Dict, List, Optional
4
- import nacos
5
2
  import socket
6
3
  import signal
7
4
  import sys
8
5
  import os
9
- import yaml
10
6
  import time
11
- import atexit
12
- import random
13
-
7
+ from typing import Callable, Dict, List, Optional
14
8
  from sycommon.config.Config import Config, SingletonMeta
15
9
  from sycommon.logging.kafka_log import SYLogger
16
10
 
11
+ from sycommon.synacos.nacos_client_base import NacosClientBase
12
+ from sycommon.synacos.nacos_service_registration import NacosServiceRegistration
13
+ from sycommon.synacos.nacos_heartbeat_manager import NacosHeartbeatManager
14
+ from sycommon.synacos.nacos_config_manager import NacosConfigManager
15
+ from sycommon.synacos.nacos_service_discovery import NacosServiceDiscovery
16
+ from sycommon.tools.env import check_env_flag, get_env_var
17
+
17
18
 
18
19
  class NacosService(metaclass=SingletonMeta):
19
20
  def __init__(self, config):
@@ -23,410 +24,65 @@ class NacosService(metaclass=SingletonMeta):
23
24
  self.service_name = config['Name']
24
25
  self.host = config['Host']
25
26
  self.port = config['Port']
26
- self.version = os.getenv('VERSION')
27
- self.enable_register_nacos = os.getenv(
28
- 'REGISTER-NACOS', 'true').lower() == 'true'
29
- self.registered = False
30
- self._client_initialized = False # 客户端初始化状态
31
- self._shutdown_event = threading.Event()
32
-
33
- # 添加可重入锁用于状态同步
34
- self._state_lock = threading.RLock()
27
+ self.version = get_env_var('VERSION')
28
+ self.enable_register_nacos = check_env_flag(
29
+ ['REGISTER-NACOS'], 'true')
35
30
 
36
- # 配置参数
37
- self.max_retries = self.nacos_config.get('maxRetries', 5)
38
- self.retry_delay = self.nacos_config.get('retryDelay', 5)
39
- self.max_retry_delay = self.nacos_config.get('maxRetryDelay', 30)
40
- # 心跳间隔:优先从配置读取,默认15秒(可通过配置修改)
41
- self.heartbeat_interval = self.nacos_config.get(
42
- 'heartbeatInterval', 15)
43
- # 心跳超时:固定设置为15秒
44
- self.heartbeat_timeout = 15
45
- self.register_retry_interval = self.nacos_config.get(
46
- 'registerRetryInterval', 15) # 注册重试间隔
47
-
48
- # 长期重试配置
49
- self.long_term_retry_delay = self.nacos_config.get(
50
- 'longTermRetryDelay', 30)
51
- self.max_long_term_retries = self.nacos_config.get(
52
- 'maxLongTermRetries', -1) # -1表示无限重试
53
-
54
- # 注册验证配置:优化默认值(增加次数+延长间隔)
55
- self.registration_verify_count = self.nacos_config.get(
56
- 'registrationVerifyCount', 1) # 验证次数
57
- self.registration_verify_interval = self.nacos_config.get(
58
- 'registrationVerifyInterval', 1) # 验证间隔
59
- self.registration_post_delay = self.nacos_config.get(
60
- 'registrationPostDelay', 3) # 注册后延迟3秒再开始验证
31
+ # 初始化基础模块
32
+ self.client_base = NacosClientBase(
33
+ self.nacos_config, self.enable_register_nacos)
61
34
 
35
+ # 获取真实IP
62
36
  self.real_ip = self.get_service_ip(self.host)
63
- self._long_term_retry_count = 0 # 长期重试计数器
64
37
 
65
- # 轮询索引,用于在所有实例中进行轮询选择
66
- self._round_robin_index = 0
67
- self._round_robin_lock = threading.Lock() # 保护轮询索引的线程安全
38
+ # 初始化各功能模块
39
+ self.registration = NacosServiceRegistration(
40
+ self.client_base, self.service_name, self.real_ip, self.port, self.version
41
+ )
42
+ self.config_manager = NacosConfigManager(self.client_base)
43
+ self.discovery = NacosServiceDiscovery(self.client_base)
44
+
45
+ # 心跳间隔配置
46
+ self.heartbeat_interval = self.nacos_config.get(
47
+ 'heartbeatInterval', 15)
48
+ self.heartbeat_manager = NacosHeartbeatManager(
49
+ self.client_base, self.registration, self.heartbeat_interval
50
+ )
68
51
 
69
52
  if self.enable_register_nacos:
70
- # 初始化客户端(仅在首次调用时执行)
71
- self._initialize_client()
72
- # 启动时清理残留实例
73
- self._cleanup_stale_instance()
53
+ # 初始化客户端
54
+ self.client_base._initialize_client()
55
+ # 清理残留实例
56
+ self.registration._cleanup_stale_instance()
74
57
  else:
75
58
  SYLogger.info("nacos:本地开发模式,不初始化Nacos客户端")
76
59
 
77
- self.share_configs = self.read_configs()
78
- # 设置llm相关配置
60
+ # 读取配置并设置到全局配置
61
+ self.share_configs = self.config_manager.read_configs(
62
+ self.nacos_config.get('sharedConfigs', []))
79
63
  Config().set_attr(self.share_configs)
80
64
 
81
- # 配置监听器
82
- self._config_listeners = {}
83
- self._config_cache = {}
84
-
85
- # 心跳相关
86
- self._last_heartbeat_time = 0
87
- self._heartbeat_fail_count = 0
88
- self._heartbeat_lock = threading.Lock()
89
- self._heartbeat_thread = None
90
-
91
- self.max_heartbeat_timeout = self.nacos_config.get(
92
- 'maxHeartbeatTimeout', 30)
93
- self._last_successful_heartbeat = time.time()
94
- # 连接监控检查间隔(新增配置,默认30秒,避免硬编码)
95
- self.connection_check_interval = self.nacos_config.get(
96
- 'connectionCheckInterval', 30)
97
- # 配置监视线程检查间隔(默认30秒)
98
- self.config_watch_interval = self.nacos_config.get(
99
- 'configWatchInterval', 30)
100
-
101
65
  # 启动配置监视线程
102
- self._watch_thread = threading.Thread(
103
- target=self._watch_configs, daemon=True)
104
- self._watch_thread.start()
66
+ self.config_manager.start_watch_configs()
105
67
 
106
- # 仅在需要注册时启动心跳和监控线程
68
+ # 仅在需要注册时启动心跳
107
69
  if self.enable_register_nacos:
108
- # 启动心跳线程
109
- self.start_heartbeat()
70
+ self.heartbeat_manager.start_heartbeat()
110
71
  else:
111
72
  SYLogger.info("nacos:本地开发模式,不启动心跳和监控线程")
112
73
 
113
- def _initialize_client(self):
114
- """初始化Nacos客户端(仅首次调用时执行)"""
115
- if self._client_initialized:
116
- return True
117
-
118
- for attempt in range(self.max_retries):
119
- try:
120
- register_ip = self.nacos_config['registerIp']
121
- namespace_id = self.nacos_config['namespaceId']
122
- self.nacos_client = nacos.NacosClient(
123
- server_addresses=register_ip,
124
- namespace=namespace_id
125
- )
126
- SYLogger.info("nacos:客户端初始化成功")
127
- self._client_initialized = True
128
- return True
129
- except Exception as e:
130
- delay = min(self.retry_delay, self.max_retry_delay)
131
- SYLogger.error(
132
- f"nacos:客户端初始化失败 (尝试 {attempt+1}/{self.max_retries}): {e}")
133
- time.sleep(delay)
134
-
135
- SYLogger.warning("nacos:无法连接到 Nacos 服务器,已达到最大重试次数")
136
- return False
137
-
138
- def _cleanup_stale_instance(self):
139
- """清理可能存在的残留实例"""
140
- if not self._client_initialized:
141
- return
142
-
143
- try:
144
- self.nacos_client.remove_naming_instance(
145
- service_name=self.service_name,
146
- ip=self.real_ip,
147
- port=int(self.port),
148
- cluster_name="DEFAULT"
149
- )
150
- SYLogger.warning(f"nacos:清理残留实例: {self.real_ip}:{self.port}")
151
- except Exception as e:
152
- SYLogger.error(f"nacos:清理残留实例异常: {e}")
153
-
154
- def ensure_client_connected(self, retry_once=False):
155
- """确保Nacos客户端已连接,返回连接状态"""
156
- # 使用线程锁保护客户端初始化状态
157
- with self._state_lock:
158
- if self._client_initialized:
159
- return True
160
-
161
- SYLogger.warning("nacos:客户端未初始化,尝试连接...")
162
-
163
- # 记录尝试次数,避免无限循环
164
- attempt = 0
165
- max_attempts = 2 if retry_once else self.max_retries
166
-
167
- while attempt < max_attempts:
168
- try:
169
- register_ip = self.nacos_config['registerIp']
170
- namespace_id = self.nacos_config['namespaceId']
171
-
172
- # 创建新的Nacos客户端实例
173
- self.nacos_client = nacos.NacosClient(
174
- server_addresses=register_ip,
175
- namespace=namespace_id
176
- )
177
-
178
- # 验证客户端是否真正可用
179
- connection_valid = self._verify_client_connection()
180
-
181
- if connection_valid:
182
- self._client_initialized = True
183
- SYLogger.info("nacos:客户端初始化成功")
184
-
185
- # 客户端重新连接后,检查服务注册状态
186
- self.registered = self.check_service_registered()
187
- return True
188
- else:
189
- raise ConnectionError("nacos:客户端初始化后无法验证连接")
190
-
191
- except Exception as e:
192
- attempt += 1
193
- delay = min(self.retry_delay, self.max_retry_delay)
194
-
195
- SYLogger.error(
196
- f"nacos:客户端初始化失败 (尝试 {attempt}/{max_attempts}): {e}")
197
- time.sleep(delay)
198
-
199
- SYLogger.error("nacos:无法连接到 Nacos 服务器,已达到最大重试次数")
200
- return False
201
-
202
- def _verify_client_connection(self):
203
- """验证客户端是否真正连接成功"""
204
- # 本地开发模式下直接返回True,不进行实际验证
205
- if not self.enable_register_nacos:
206
- return True
207
-
208
- try:
209
- # 使用当前服务的命名实例查询来验证连接
210
- namespace_id = self.nacos_config['namespaceId']
211
- self.nacos_client.list_naming_instance(
212
- service_name=self.service_name,
213
- namespace_id=namespace_id,
214
- group_name="DEFAULT_GROUP",
215
- healthy_only=True
216
- )
217
- return True
218
- except Exception as e:
219
- SYLogger.warning(f"nacos:客户端连接验证失败: {e}")
220
- return False
221
-
222
- def check_service_registered(self):
223
- """检查服务是否已注册(基于实例列表)"""
224
- # 本地开发模式下直接返回True,模拟已注册状态
225
- if not self.enable_register_nacos:
226
- return True
227
-
228
- if not self.ensure_client_connected():
229
- return False
230
-
231
- try:
232
- namespace_id = self.nacos_config['namespaceId']
233
- instances = self.nacos_client.list_naming_instance(
234
- service_name=self.service_name,
235
- namespace_id=namespace_id,
236
- group_name="DEFAULT_GROUP",
237
- healthy_only=True,
238
- )
239
-
240
- # 检查是否存在包含当前IP和端口的实例
241
- found = False
242
- for instance in instances.get('hosts', []):
243
- if (instance.get('ip') == self.real_ip and
244
- instance.get('port') == int(self.port)):
245
- SYLogger.info(f"nacos:找到已注册实例: {self.real_ip}:{self.port}")
246
- found = True
247
- break
248
-
249
- if not found:
250
- SYLogger.warning(f"nacos:未找到注册实例: {self.real_ip}:{self.port}")
251
-
252
- # 带锁更新注册状态
253
- with self._state_lock:
254
- self.registered = found
255
-
256
- return found
257
- except Exception as e:
258
- SYLogger.error(f"nacos:检查服务注册状态失败: {e}")
259
- return False
260
-
261
- def verify_registration(self):
262
- """多次验证服务是否成功注册"""
263
- success_count = 0
264
- SYLogger.info(
265
- f"nacos:开始验证服务注册状态,共验证 {self.registration_verify_count} 次")
266
-
267
- for i in range(self.registration_verify_count):
268
- if self.check_service_registered():
269
- success_count += 1
270
- else:
271
- SYLogger.warning(f"nacos:第 {i+1} 次验证未找到注册实例")
272
-
273
- if i < self.registration_verify_count - 1:
274
- time.sleep(self.registration_verify_interval)
275
-
276
- if success_count >= self.registration_verify_count / 2:
277
- SYLogger.info(
278
- f"nacos:服务注册验证成功,{success_count}/{self.registration_verify_count} 次验证通过")
279
- return True
280
- else:
281
- SYLogger.error(
282
- f"nacos:服务注册验证失败,仅 {success_count}/{self.registration_verify_count} 次验证通过")
283
- return False
284
-
285
- def register_with_retry(self):
286
- """带重试机制的服务注册(基于实例列表检查)"""
287
- retry_count = 0
288
- last_error = None
289
-
290
- # 带锁重置注册状态
291
- with self._state_lock:
292
- self.registered = False
293
-
294
- while (not self.registered) and (self.max_long_term_retries < 0 or retry_count < self.max_long_term_retries):
295
- # 增加状态检查点,防止重复注册
296
- with self._state_lock:
297
- if self.registered:
298
- return True
299
-
300
- try:
301
- # 尝试注册服务
302
- register_success = self.register(force=True)
303
-
304
- if not register_success:
305
- raise RuntimeError("nacos:服务注册请求失败")
306
-
307
- # 关键优化1:注册请求发送后,延迟一段时间再验证(默认3秒)
308
- SYLogger.info(
309
- f"nacos:服务注册请求已发送,延迟 {self.registration_post_delay} 秒后开始验证(确保Nacos服务器完成实例写入)")
310
- time.sleep(self.registration_post_delay)
311
-
312
- # 关键优化2:多次验证服务是否真正注册成功(默认3次,每次间隔2秒)
313
- registered = self.verify_registration()
314
-
315
- # 带锁更新注册状态
316
- with self._state_lock:
317
- self.registered = registered
318
-
319
- # 再次检查状态,防止其他线程修改
320
- with self._state_lock:
321
- if self.registered:
322
- # 注册成功后,更新客户端状态
323
- self._client_initialized = True
324
-
325
- # 注册成功后,通知心跳线程立即发送心跳
326
- self._shutdown_event.set()
327
- self._shutdown_event.clear()
328
-
329
- # 注册成功后,更新监控线程的状态
330
- self._long_term_retry_count = 0
331
-
332
- SYLogger.info(
333
- f"nacos:服务注册成功并通过验证: {self.service_name}")
334
- return True
335
- else:
336
- raise RuntimeError("nacos:服务注册验证失败")
337
-
338
- except Exception as e:
339
- last_error = str(e)
340
- retry_count += 1
341
- delay = min(self.register_retry_interval, self.max_retry_delay)
342
-
343
- SYLogger.warning(
344
- f"nacos:服务注册尝试 {retry_count} 失败: {last_error},{delay}秒后重试")
345
- time.sleep(delay)
346
-
347
- # 最终检查,防止在最后一次重试后其他线程成功注册
348
- with self._state_lock:
349
- if self.registered:
350
- return True
351
-
352
- # 确实注册失败
353
- if last_error:
354
- SYLogger.error(f"nacos:服务注册失败,最终错误: {last_error}")
355
- else:
356
- SYLogger.error(f"nacos:服务注册失败,已达到最大重试次数: {self.service_name}")
357
-
358
- return False
359
-
360
- def register(self, force=False):
361
- """注册服务到Nacos"""
362
- # 使用状态锁保护注册状态
363
- with self._state_lock:
364
- if self.registered and not force and self.check_service_registered():
365
- return True
366
-
367
- if self.registered and not force:
368
- self.registered = False
369
- SYLogger.warning("nacos:本地状态显示已注册,但Nacos中未找到服务实例,准备重新注册")
370
-
371
- metadata = {
372
- "ignore-metrics": "true",
373
- # "preserved.heart.beat.interval": "3000", # 心跳间隔 3 秒
374
- # "preserved.heart.beat.timeout": "15000", # 心跳超时 15 秒
375
- # "preserved.ip.delete.timeout": "30000" # 实例删除超时 30 秒
376
- }
377
- if self.version:
378
- metadata["version"] = self.version
379
-
380
- for attempt in range(self.max_retries):
381
- if not self.ensure_client_connected():
382
- return False
383
-
384
- try:
385
- # 注册服务
386
- self.nacos_client.add_naming_instance(
387
- service_name=self.service_name,
388
- ip=self.real_ip,
389
- port=int(self.port),
390
- metadata=metadata,
391
- cluster_name="DEFAULT",
392
- healthy=True,
393
- ephemeral=True,
394
- heartbeat_interval=self.heartbeat_interval
395
- )
396
- SYLogger.info(
397
- f"nacos:服务 {self.service_name} 注册请求已发送: {self.real_ip}:{self.port}")
398
-
399
- # 注册退出时的清理函数
400
- if not hasattr(self, '_atexit_registered') or not self._atexit_registered:
401
- atexit.register(self.deregister_service)
402
- self._atexit_registered = True
403
-
404
- return True
405
- except Exception as e:
406
- if "signal only works in main thread" in str(e):
407
- return True
408
- elif attempt < self.max_retries - 1:
409
- SYLogger.warning(
410
- f"nacos:服务注册失败 (尝试 {attempt+1}/{self.max_retries}): {e}")
411
- time.sleep(self.retry_delay)
412
- else:
413
- SYLogger.error(f"nacos:服务注册失败,已达到最大重试次数: {e}")
414
- return False
415
-
416
74
  @staticmethod
417
75
  def setup_nacos(config: dict):
418
- """创建并初始化Nacos管理器"""
76
+ """创建并初始化Nacos管理器(保持原有接口)"""
419
77
  instance = NacosService(config)
420
78
 
421
- # 仅在需要注册时执行注册逻辑
422
79
  if instance.enable_register_nacos:
423
- # 使用带超时的等待机制,而不是单次尝试
424
- timeout = 60 # 60秒超时
80
+ # 启动注册线程
81
+ timeout = 60
425
82
  start_time = time.time()
426
83
 
427
- # 启动注册线程,不阻塞主线程(替换原线程池)
428
84
  register_thread = threading.Thread(
429
- target=instance.register_with_retry,
85
+ target=instance.registration.register_with_retry,
430
86
  daemon=True,
431
87
  name="NacosRegisterThread"
432
88
  )
@@ -434,244 +90,38 @@ class NacosService(metaclass=SingletonMeta):
434
90
 
435
91
  # 等待注册完成或超时
436
92
  while True:
437
- # 带锁检查状态
438
- with instance._state_lock:
439
- if instance.registered:
440
- break
93
+ if instance.registration.registered:
94
+ break
441
95
 
442
96
  if time.time() - start_time >= timeout:
443
- # 超时处理
444
97
  break
445
98
 
446
99
  time.sleep(1)
447
100
 
448
101
  # 最终状态检查
449
- with instance._state_lock:
450
- if not instance.registered:
451
- # 清理并抛出异常
452
- try:
453
- instance.deregister_service()
454
- except Exception as e:
455
- SYLogger.error(f"nacos:服务注册失败后,注销服务时发生错误: {e}")
456
- raise RuntimeError("nacos:服务注册失败,应用启动终止")
102
+ if not instance.registration.registered:
103
+ try:
104
+ instance.registration.deregister_service()
105
+ except Exception as e:
106
+ SYLogger.error(f"nacos:服务注册失败后,注销服务时发生错误: {e}")
107
+ raise RuntimeError("nacos:服务注册失败,应用启动终止")
457
108
 
458
- # 服务注册成功后再注册信号处理
109
+ # 注册信号处理
459
110
  signal.signal(signal.SIGTERM, instance.handle_signal)
460
111
  signal.signal(signal.SIGINT, instance.handle_signal)
461
112
 
462
113
  # 启动连接监控线程
463
- threading.Thread(target=instance.monitor_connection,
464
- daemon=True, name="NacosConnectionMonitorThread").start()
114
+ threading.Thread(target=instance.discovery.monitor_connection,
115
+ args=(instance.registration,),
116
+ daemon=True,
117
+ name="NacosConnectionMonitorThread").start()
465
118
  else:
466
119
  SYLogger.info("nacos:本地开发模式,跳过服务注册流程")
467
120
 
468
121
  return instance
469
122
 
470
- def start_heartbeat(self):
471
- """启动心跳线程(确保单例)"""
472
- with self._heartbeat_lock: # 加锁确保线程安全
473
- # 双重检查:先判断线程是否已存在且存活
474
- if self._heartbeat_thread is not None and self._heartbeat_thread.is_alive():
475
- return
476
-
477
- # 彻底清理可能的残留线程引用
478
- self._heartbeat_thread = None
479
-
480
- # 创建新的心跳线程
481
- self._heartbeat_thread = threading.Thread(
482
- target=self._send_heartbeat_loop,
483
- name="NacosHeartbeatThread",
484
- daemon=True
485
- )
486
- self._heartbeat_thread.daemon = True
487
- self._heartbeat_thread.start()
488
- SYLogger.info(
489
- f"nacos:心跳线程启动,线程ID: {self._heartbeat_thread.ident},"
490
- f"心跳间隔: {self.heartbeat_interval}秒,"
491
- f"心跳超时: {self.heartbeat_timeout}秒"
492
- )
493
-
494
- def _send_heartbeat_loop(self):
495
- """优化后的心跳发送循环,确保严格按间隔执行"""
496
- current_thread = threading.current_thread()
497
- thread_ident = current_thread.ident
498
- SYLogger.info(
499
- f"nacos:心跳循环启动 - 线程ID: {thread_ident}, "
500
- f"配置间隔: {self.heartbeat_interval}秒, "
501
- f"超时时间: {self.heartbeat_timeout}秒"
502
- )
503
-
504
- consecutive_fail = 0 # 连续失败计数器
505
-
506
- while not self._shutdown_event.is_set():
507
- # 记录当前时间,作为本次心跳的基准
508
- current_time = time.time()
509
-
510
- try:
511
- # 检查注册状态(带锁读取)
512
- with self._state_lock:
513
- registered_status = self.registered
514
-
515
- if not registered_status:
516
- SYLogger.warning(
517
- f"nacos:服务未注册,跳过心跳 - 线程ID: {thread_ident}")
518
- consecutive_fail = 0
519
- else:
520
- # 发送心跳(10秒超时)
521
- success = self.send_heartbeat()
522
- if success:
523
- consecutive_fail = 0
524
- self._last_successful_heartbeat = current_time
525
- SYLogger.info(
526
- f"nacos:心跳发送成功 - 时间: {current_time:.3f}, "
527
- f"间隔: {self.heartbeat_interval}秒"
528
- )
529
- else:
530
- consecutive_fail += 1
531
- SYLogger.warning(
532
- f"nacos:心跳发送失败 - 连续失败: {consecutive_fail}次"
533
- )
534
- if consecutive_fail >= 5:
535
- SYLogger.error("nacos:心跳连续失败5次,尝试重连")
536
- self.reconnect_nacos_client()
537
- consecutive_fail = 0
538
-
539
- except Exception as e:
540
- consecutive_fail += 1
541
- SYLogger.error(
542
- f"nacos:心跳异常: {str(e)}, 连续失败: {consecutive_fail}次")
543
-
544
- # 计算下次执行时间(当前时间 + 配置间隔),确保间隔稳定
545
- next_run_time = current_time + self.heartbeat_interval
546
- sleep_time = max(0, next_run_time - time.time()
547
- ) # 避免负数(处理耗时超过间隔的情况)
548
- self._shutdown_event.wait(sleep_time) # 精准休眠至下次执行时间
549
-
550
- SYLogger.info(f"nacos:心跳循环已停止 - 线程ID: {thread_ident}")
551
-
552
- def send_heartbeat(self):
553
- """发送心跳并添加10秒超时控制(替换线程池实现)"""
554
- if not self.ensure_client_connected():
555
- SYLogger.warning("nacos:客户端未连接,心跳发送失败")
556
- return False
557
-
558
- # 用线程+join实现10秒超时控制
559
- result_list = [] # 用于线程间传递结果
560
-
561
- def heartbeat_task():
562
- """心跳实际执行任务"""
563
- try:
564
- result = self._send_heartbeat_internal()
565
- result_list.append(result)
566
- except Exception as e:
567
- SYLogger.error(f"nacos:心跳任务执行异常: {e}")
568
- result_list.append(False)
569
-
570
- # 启动心跳任务线程
571
- task_thread = threading.Thread(
572
- target=heartbeat_task,
573
- daemon=True,
574
- name="NacosHeartbeatTaskThread"
575
- )
576
- task_thread.start()
577
-
578
- # 等待线程完成,最多等待10秒
579
- task_thread.join(timeout=self.heartbeat_timeout)
580
-
581
- # 处理结果
582
- if not result_list:
583
- # 超时未返回
584
- SYLogger.error(f"nacos:心跳发送超时({self.heartbeat_timeout}秒)")
585
- self._client_initialized = False # 强制重连
586
- return False
587
-
588
- # 检查心跳结果
589
- if result_list[0]:
590
- self._last_successful_heartbeat = time.time()
591
- return result_list[0]
592
-
593
- def _send_heartbeat_internal(self):
594
- """实际的心跳发送逻辑"""
595
- result = self.nacos_client.send_heartbeat(
596
- service_name=self.service_name,
597
- ip=self.real_ip,
598
- port=int(self.port),
599
- cluster_name="DEFAULT",
600
- weight=1.0,
601
- metadata={"version": self.version} if self.version else None
602
- )
603
-
604
- # 处理返回结果
605
- if result and isinstance(result, dict) and result.get('lightBeatEnabled', False):
606
- SYLogger.info(f"nacos:心跳发送成功,Nacos返回: {result}")
607
- return True
608
- else:
609
- SYLogger.warning(f"nacos:心跳发送失败,Nacos返回: {result}")
610
- return False
611
-
612
- def reconnect_nacos_client(self):
613
- """重新连接Nacos客户端"""
614
- SYLogger.warning("nacos:尝试重新连接Nacos客户端")
615
- self._client_initialized = False
616
- return self.ensure_client_connected()
617
-
618
- def monitor_connection(self):
619
- """优化的连接监控线程,缩短检查间隔"""
620
- check_interval = self.connection_check_interval
621
- thread_start_time = time.time()
622
- check_counter = 0
623
-
624
- while not self._shutdown_event.is_set():
625
- try:
626
- current_time = time.time()
627
-
628
- SYLogger.info(
629
- f"nacos:连接监控线程运行中,检查间隔: {check_interval}s")
630
-
631
- # 检查客户端连接状态
632
- if not self.ensure_client_connected():
633
- SYLogger.warning("nacos:检测到Nacos客户端连接丢失,尝试重新初始化")
634
- self._initialize_client() # 尝试重新初始化客户端
635
-
636
- # 检查服务注册状态
637
- current_registered = self.check_service_registered()
638
-
639
- # 带锁更新注册状态
640
- with self._state_lock:
641
- if current_registered != self.registered:
642
- if current_registered:
643
- self.registered = True
644
- SYLogger.info(f"nacos:服务实例已重新注册")
645
- else:
646
- self.registered = False
647
- SYLogger.warning(f"nacos:服务实例未注册,尝试重新注册")
648
- # 启动临时线程执行重新注册(替换原线程池)
649
- retry_thread = threading.Thread(
650
- target=self.register_with_retry,
651
- daemon=True,
652
- name="NacosRetryRegisterThread"
653
- )
654
- retry_thread.start()
655
-
656
- # 20%的概率执行深度检查
657
- if random.random() < 0.2:
658
- self.verify_registration()
659
-
660
- # 每小时重置一次内部状态
661
- if current_time - thread_start_time > 3600:
662
- SYLogger.info("nacos:连接监控线程已运行1小时,重置内部状态")
663
- thread_start_time = current_time
664
- check_counter = 0
665
-
666
- check_counter += 1
667
- # 休眠指定时间
668
- self._shutdown_event.wait(check_interval)
669
- except Exception as e:
670
- SYLogger.error(f"nacos:连接监控异常: {e}")
671
- time.sleep(self.retry_delay)
672
-
673
123
  def get_service_ip(self, config_ip):
674
- """获取服务实际IP地址"""
124
+ """获取服务实际IP地址(保持原有逻辑)"""
675
125
  if config_ip in ['127.0.0.1', '0.0.0.0']:
676
126
  try:
677
127
  with socket.socket(socket.AF_INET, socket.SOCK_DGRAM) as s:
@@ -681,191 +131,21 @@ class NacosService(metaclass=SingletonMeta):
681
131
  return '127.0.0.1'
682
132
  return config_ip
683
133
 
684
- def deregister_service(self):
685
- """从Nacos注销服务"""
686
- with self._state_lock:
687
- if not self.registered or not self._client_initialized:
688
- return
689
-
690
- SYLogger.info("nacos:正在注销服务...")
691
- try:
692
- self.nacos_client.remove_naming_instance(
693
- service_name=self.service_name,
694
- ip=self.real_ip,
695
- port=int(self.port),
696
- cluster_name="DEFAULT"
697
- )
698
- with self._state_lock:
699
- self.registered = False
700
- SYLogger.info(f"nacos:服务 {self.service_name} 已注销")
701
- except Exception as e:
702
- SYLogger.error(f"nacos:注销服务时发生错误: {e}")
703
- finally:
704
- self._shutdown_event.set()
705
-
706
134
  def handle_signal(self, signum, frame):
707
- """处理退出信号"""
135
+ """处理退出信号(保持原有逻辑)"""
708
136
  SYLogger.info(f"nacos:收到信号 {signum},正在关闭服务...")
709
- self.deregister_service()
137
+ self.registration.deregister_service()
710
138
  sys.exit(0)
711
139
 
712
- def read_configs(self) -> dict:
713
- """读取共享配置"""
714
- configs = {}
715
- shared_configs = self.nacos_config.get('sharedConfigs', [])
716
-
717
- for config in shared_configs:
718
- data_id = config['dataId']
719
- group = config['group']
720
-
721
- for attempt in range(self.max_retries):
722
- try:
723
- # 检查客户端连接
724
- if not self.ensure_client_connected():
725
- self.reconnect_nacos_client()
726
-
727
- # 获取配置
728
- content = self.nacos_client.get_config(data_id, group)
729
-
730
- try:
731
- configs[data_id] = json.loads(content)
732
- except json.JSONDecodeError:
733
- try:
734
- configs[data_id] = yaml.safe_load(content)
735
- except yaml.YAMLError:
736
- SYLogger.error(f"nacos:无法解析 {data_id} 的内容")
737
- break
738
- except Exception as e:
739
- if attempt < self.max_retries - 1:
740
- SYLogger.warning(
741
- f"nacos:读取配置 {data_id} 失败 (尝试 {attempt+1}/{self.max_retries}): {e}")
742
- time.sleep(self.retry_delay)
743
- else:
744
- SYLogger.error(
745
- f"nacos:读取配置 {data_id} 失败,已达到最大重试次数: {e}")
746
-
747
- return configs
748
-
140
+ # 以下为兼容原有接口的封装方法
749
141
  def add_config_listener(self, data_id: str, callback: Callable[[str], None]):
750
- """添加配置变更监听器"""
751
- self._config_listeners[data_id] = callback
752
- # 初始获取一次配置
753
- if config := self.get_config(data_id):
754
- callback(config)
142
+ return self.config_manager.add_config_listener(data_id, callback)
755
143
 
756
144
  def get_config(self, data_id: str, group: str = "DEFAULT_GROUP") -> Optional[str]:
757
- """获取配置内容"""
758
- if not self.ensure_client_connected():
759
- return None
760
-
761
- try:
762
- return self.nacos_client.get_config(data_id, group=group)
763
- except Exception as e:
764
- SYLogger.error(f"nacos:获取配置 {data_id} 失败: {str(e)}")
765
- return None
766
-
767
- def _watch_configs(self):
768
- """配置监听线程"""
769
- check_interval = self.config_watch_interval
770
-
771
- while not self._shutdown_event.is_set():
772
- try:
773
- for data_id, callback in list(self._config_listeners.items()):
774
- new_config = self.get_config(data_id)
775
- if new_config and new_config != self._config_cache.get(data_id):
776
- # 直接执行回调(替换原线程池,配置回调通常为轻量操作)
777
- callback(new_config)
778
- self._config_cache[data_id] = new_config
779
- try:
780
- self.share_configs[data_id] = json.loads(
781
- new_config)
782
- except json.JSONDecodeError:
783
- try:
784
- self.share_configs[data_id] = yaml.safe_load(
785
- new_config)
786
- except yaml.YAMLError:
787
- SYLogger.error(f"nacos:无法解析 {data_id} 的内容")
788
- except Exception as e:
789
- SYLogger.error(f"nacos:配置监视线程异常: {str(e)}")
790
- self._shutdown_event.wait(check_interval)
145
+ return self.config_manager.get_config(data_id, group)
791
146
 
792
147
  def discover_services(self, service_name: str, group: str = "DEFAULT_GROUP", version: str = None) -> List[Dict]:
793
- """发现服务实例列表 (与Java格式兼容)"""
794
- if not self.ensure_client_connected():
795
- return []
796
-
797
- return self.get_service_instances(service_name, group, version)
148
+ return self.discovery.discover_services(service_name, group, version)
798
149
 
799
150
  def get_service_instances(self, service_name: str, group: str = "DEFAULT_GROUP", target_version: str = None) -> List[Dict]:
800
- """
801
- 获取服务实例列表,并按照以下优先级规则筛选:
802
- 1. 相同版本号的实例
803
- 2. 无版本号的实例
804
- 3. 所有实例中轮询
805
- """
806
- try:
807
- namespace_id = self.nacos_config['namespaceId']
808
- instances = self.nacos_client.list_naming_instance(
809
- service_name,
810
- namespace_id=namespace_id,
811
- group_name=group,
812
- healthy_only=True,
813
- )
814
-
815
- if not instances or 'hosts' not in instances:
816
- SYLogger.info(f"nacos:未发现 {service_name} 的服务实例")
817
- return []
818
-
819
- all_instances = instances.get('hosts', [])
820
- # 筛选已上线实例
821
- all_instances = [
822
- instance for instance in all_instances
823
- if instance.get('enabled', True) # 默认True担心阿里变更sdk
824
- ]
825
- SYLogger.info(
826
- f"nacos:共发现 {len(all_instances)} 个 {service_name} 服务实例")
827
-
828
- # 确定要使用的目标版本,如果未指定则使用当前服务的版本
829
- version_to_use = target_version or self.version
830
-
831
- # 按规则筛选实例
832
- if version_to_use:
833
- # 1. 筛选相同版本号的实例
834
- same_version_instances = [
835
- instance for instance in all_instances
836
- if instance.get('metadata', {}).get('version') == version_to_use
837
- ]
838
-
839
- if same_version_instances:
840
- SYLogger.info(
841
- f"nacos:筛选出 {len(same_version_instances)} 个与当前版本({version_to_use})匹配的实例")
842
- return same_version_instances
843
-
844
- # 2. 如果没有相同版本的实例,筛选无版本号的实例
845
- no_version_instances = [
846
- instance for instance in all_instances
847
- if 'version' not in instance.get('metadata', {})
848
- ]
849
-
850
- if no_version_instances:
851
- SYLogger.info(
852
- f"nacos:未找到相同版本({version_to_use})的实例,筛选出 {len(no_version_instances)} 个无版本号的实例")
853
- return no_version_instances
854
-
855
- # 3. 如果没有指定版本或前两个规则都不满足,使用轮询方式选择所有健康实例
856
- SYLogger.info(
857
- f"nacos:使用轮询方式从 {len(all_instances)} 个实例中选择")
858
-
859
- # 线程安全地获取下一个轮询索引
860
- with self._round_robin_lock:
861
- selected_index = self._round_robin_index % len(all_instances)
862
- # 更新轮询索引,为下一次请求做准备
863
- self._round_robin_index = (
864
- selected_index + 1) % len(all_instances)
865
-
866
- # 返回包含当前选中实例的列表
867
- return [all_instances[selected_index]]
868
-
869
- except Exception as e:
870
- SYLogger.error(f"nacos:服务发现失败: {service_name}: {str(e)}")
871
- return []
151
+ return self.discovery.get_service_instances(service_name, group, target_version)