entari-plugin-hyw 3.3.7__py3-none-any.whl → 3.3.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of entari-plugin-hyw might be problematic. Click here for more details.

@@ -58,13 +58,11 @@ class HywConfig(BasicConfModel):
58
58
  base_url: str = "https://openrouter.ai/api/v1"
59
59
  vision_model_name: Optional[str] = None
60
60
  vision_api_key: Optional[str] = None
61
+ language: str = "Simplified Chinese"
61
62
  vision_base_url: Optional[str] = None
62
- vision_system_prompt: Optional[str] = None
63
- intruct_model_name: Optional[str] = None
64
- intruct_api_key: Optional[str] = None
65
- intruct_base_url: Optional[str] = None
66
- intruct_system_prompt: Optional[str] = None
67
- agent_system_prompt: Optional[str] = None
63
+ instruct_model_name: Optional[str] = None
64
+ instruct_api_key: Optional[str] = None
65
+ instruct_base_url: Optional[str] = None
68
66
  search_base_url: str = "https://lite.duckduckgo.com/lite/?q={query}"
69
67
  image_search_base_url: str = "https://duckduckgo.com/?q={query}&iax=images&ia=images"
70
68
  headless: bool = False
@@ -72,8 +70,10 @@ class HywConfig(BasicConfModel):
72
70
  icon: str = "openai"
73
71
  render_timeout_ms: int = 6000
74
72
  extra_body: Optional[Dict[str, Any]] = None
73
+ vision_extra_body: Optional[Dict[str, Any]] = None
74
+ instruct_extra_body: Optional[Dict[str, Any]] = None
75
75
  enable_browser_fallback: bool = False
76
- reaction: bool = True
76
+ reaction: bool = False
77
77
  quote: bool = True
78
78
  temperature: float = 0.4
79
79
  # Billing configuration (price per million tokens)
@@ -83,14 +83,14 @@ class HywConfig(BasicConfModel):
83
83
  vision_input_price: Optional[float] = None
84
84
  vision_output_price: Optional[float] = None
85
85
  # Instruct model pricing overrides (defaults to main model pricing if not set)
86
- intruct_input_price: Optional[float] = None
87
- intruct_output_price: Optional[float] = None
86
+ instruct_input_price: Optional[float] = None
87
+ instruct_output_price: Optional[float] = None
88
88
  # Provider Names
89
89
  search_name: str = "DuckDuckGo"
90
90
  search_provider: str = "crawl4ai" # crawl4ai | httpx | ddgs
91
91
  model_provider: Optional[str] = None
92
92
  vision_model_provider: Optional[str] = None
93
- intruct_model_provider: Optional[str] = None
93
+ instruct_model_provider: Optional[str] = None
94
94
 
95
95
 
96
96
 
Binary file
@@ -12,27 +12,27 @@ class HYWConfig:
12
12
  fusion_mode: bool = False
13
13
  save_conversation: bool = False
14
14
  headless: bool = True
15
- intruct_model_name: Optional[str] = None
16
- intruct_api_key: Optional[str] = None
17
- intruct_base_url: Optional[str] = None
15
+ instruct_model_name: Optional[str] = None
16
+ instruct_api_key: Optional[str] = None
17
+ instruct_base_url: Optional[str] = None
18
18
  search_base_url: str = "https://lite.duckduckgo.com/lite/?q={query}"
19
19
  image_search_base_url: str = "https://duckduckgo.com/?q={query}&iax=images&ia=images"
20
20
  search_params: Optional[str] = None # e.g. "&kl=cn-zh" for China region
21
21
  search_limit: int = 8
22
22
  extra_body: Optional[Dict[str, Any]] = None
23
+ vision_extra_body: Optional[Dict[str, Any]] = None
24
+ instruct_extra_body: Optional[Dict[str, Any]] = None
23
25
  temperature: float = 0.4
24
26
  max_turns: int = 10
25
27
  icon: str = "openai" # logo for primary model
26
28
  vision_icon: Optional[str] = None # logo for vision model (falls back to icon when absent)
27
29
  instruct_icon: Optional[str] = None # logo for instruct model
28
30
  enable_browser_fallback: bool = False
29
- vision_system_prompt: Optional[str] = None
30
- intruct_system_prompt: Optional[str] = None
31
- agent_system_prompt: Optional[str] = None
31
+ language: str = "Simplified Chinese"
32
32
  input_price: Optional[float] = None # $ per 1M input tokens
33
33
  output_price: Optional[float] = None # $ per 1M output tokens
34
34
  vision_input_price: Optional[float] = None
35
35
  vision_output_price: Optional[float] = None
36
- intruct_input_price: Optional[float] = None
37
- intruct_output_price: Optional[float] = None
36
+ instruct_input_price: Optional[float] = None
37
+ instruct_output_price: Optional[float] = None
38
38
 
@@ -12,14 +12,14 @@ from .config import HYWConfig
12
12
  from ..utils.search import SearchService
13
13
  from ..utils.prompts import (
14
14
  AGENT_SP,
15
- AGENT_SP_INTRUCT_VISION_ADD,
15
+ AGENT_SP_INSTRUCT_VISION_ADD,
16
16
  AGENT_SP_TOOLS_STANDARD_ADD,
17
17
  AGENT_SP_TOOLS_AGENT_ADD,
18
18
  AGENT_SP_SEARCH_ADD,
19
19
  AGENT_SP_PAGE_ADD,
20
20
  AGENT_SP_IMAGE_SEARCH_ADD,
21
- INTRUCT_SP,
22
- INTRUCT_SP_VISION_ADD,
21
+ INSTRUCT_SP,
22
+ INSTRUCT_SP_VISION_ADD,
23
23
  VISION_SP,
24
24
  )
25
25
 
@@ -109,7 +109,7 @@ class ProcessingPipeline:
109
109
  ) -> Dict[str, Any]:
110
110
  """
111
111
  1) Vision: summarize images once (no image persistence).
112
- 2) Intruct: run web_search and decide whether to grant Playwright MCP tools.
112
+ 2) Instruct: run web_search and decide whether to grant Playwright MCP tools.
113
113
  3) Agent: normally no tools; if granted, allow Playwright MCP tools (max 6 rounds; step 5 nudge, step 6 forced).
114
114
  """
115
115
  start_time = time.time()
@@ -133,7 +133,7 @@ class ProcessingPipeline:
133
133
 
134
134
  trace: Dict[str, Any] = {
135
135
  "vision": None,
136
- "intruct": None,
136
+ "instruct": None,
137
137
  "agent": None,
138
138
  }
139
139
 
@@ -150,8 +150,7 @@ class ProcessingPipeline:
150
150
  or getattr(self.config, "vision_model_name", None)
151
151
  or active_model
152
152
  )
153
- vision_prompt_tpl = getattr(self.config, "vision_system_prompt", None) or VISION_SP
154
- vision_prompt = vision_prompt_tpl.format(user_msgs=user_input or "[图片]")
153
+ vision_prompt = VISION_SP.format(user_msgs=user_input or "[图片]")
155
154
  vision_text, vision_usage = await self._run_vision_stage(
156
155
  user_input=user_input,
157
156
  images=images,
@@ -182,10 +181,10 @@ class ProcessingPipeline:
182
181
  "cost": vision_cost
183
182
  }
184
183
 
185
- # Intruct + pre-search
184
+ # Instruct + pre-search
186
185
  instruct_start = time.time()
187
- instruct_model = getattr(self.config, "intruct_model_name", None) or active_model
188
- instruct_text, search_payloads, intruct_trace, intruct_usage, search_time = await self._run_instruct_stage(
186
+ instruct_model = getattr(self.config, "instruct_model_name", None) or active_model
187
+ instruct_text, search_payloads, instruct_trace, instruct_usage, search_time = await self._run_instruct_stage(
189
188
  user_input=user_input,
190
189
  vision_text=vision_text,
191
190
  model=instruct_model,
@@ -194,24 +193,24 @@ class ProcessingPipeline:
194
193
 
195
194
  # Calculate Instruct Cost
196
195
  instruct_cost = 0.0
197
- i_in_price = float(getattr(self.config, "intruct_input_price", None) or getattr(self.config, "input_price", 0.0) or 0.0)
198
- i_out_price = float(getattr(self.config, "intruct_output_price", None) or getattr(self.config, "output_price", 0.0) or 0.0)
196
+ i_in_price = float(getattr(self.config, "instruct_input_price", None) or getattr(self.config, "input_price", 0.0) or 0.0)
197
+ i_out_price = float(getattr(self.config, "instruct_output_price", None) or getattr(self.config, "output_price", 0.0) or 0.0)
199
198
  if i_in_price > 0 or i_out_price > 0:
200
- instruct_cost = (intruct_usage.get("input_tokens", 0) / 1_000_000 * i_in_price) + (intruct_usage.get("output_tokens", 0) / 1_000_000 * i_out_price)
199
+ instruct_cost = (instruct_usage.get("input_tokens", 0) / 1_000_000 * i_in_price) + (instruct_usage.get("output_tokens", 0) / 1_000_000 * i_out_price)
201
200
 
202
201
  # Add instruct usage
203
- usage_totals["input_tokens"] += intruct_usage.get("input_tokens", 0)
204
- usage_totals["output_tokens"] += intruct_usage.get("output_tokens", 0)
202
+ usage_totals["input_tokens"] += instruct_usage.get("input_tokens", 0)
203
+ usage_totals["output_tokens"] += instruct_usage.get("output_tokens", 0)
205
204
 
206
- intruct_trace["time"] = instruct_time
207
- intruct_trace["cost"] = instruct_cost
208
- trace["intruct"] = intruct_trace
205
+ instruct_trace["time"] = instruct_time
206
+ instruct_trace["cost"] = instruct_cost
207
+ trace["instruct"] = instruct_trace
209
208
 
210
209
  # Start agent loop
211
210
  agent_start_time = time.time()
212
211
  current_history.append({"role": "user", "content": user_input or "..."})
213
212
 
214
- mode = intruct_trace.get("mode", self.current_mode).lower()
213
+ mode = instruct_trace.get("mode", self.current_mode).lower()
215
214
  logger.success(f"Instruct Mode: {mode}")
216
215
  self.current_mode = mode
217
216
 
@@ -255,18 +254,17 @@ class ProcessingPipeline:
255
254
  has_image_results = any(r.get("_type") == "image" for r in self.all_web_results)
256
255
 
257
256
  # Build agent system prompt
258
- agent_prompt_tpl = getattr(self.config, "agent_system_prompt", None) or AGENT_SP
259
-
260
257
  mode_desc_text = AGENT_SP_TOOLS_AGENT_ADD.format(tools_desc=tools_desc) if mode == "agent" else AGENT_SP_TOOLS_STANDARD_ADD
261
- system_prompt = agent_prompt_tpl.format(
258
+ system_prompt = AGENT_SP.format(
262
259
  user_msgs=user_msgs_text,
263
260
  mode=mode,
264
- mode_desc=mode_desc_text
261
+ mode_desc=mode_desc_text,
262
+ language=getattr(self.config, "language", "Simplified Chinese")[:128]
265
263
  )
266
264
 
267
265
  # Append vision text if available
268
266
  if vision_text:
269
- system_prompt += AGENT_SP_INTRUCT_VISION_ADD.format(vision_msgs=vision_text)
267
+ system_prompt += AGENT_SP_INSTRUCT_VISION_ADD.format(vision_msgs=vision_text)
270
268
 
271
269
  # Append search results
272
270
  if has_search_results and search_msgs_text:
@@ -299,6 +297,7 @@ class ProcessingPipeline:
299
297
  model=active_model,
300
298
  tools=tools_for_step,
301
299
  tool_choice="auto" if tools_for_step else None,
300
+ extra_body=self.config.extra_body,
302
301
  )
303
302
  step_llm_time = time.time() - step_llm_start
304
303
 
@@ -366,8 +365,8 @@ class ProcessingPipeline:
366
365
  a_in_price = float(getattr(self.config, "input_price", 0.0) or 0.0)
367
366
  a_out_price = float(getattr(self.config, "output_price", 0.0) or 0.0)
368
367
 
369
- agent_input_tokens = usage_totals["input_tokens"] - vision_usage.get("input_tokens", 0) - intruct_usage.get("input_tokens", 0)
370
- agent_output_tokens = usage_totals["output_tokens"] - vision_usage.get("output_tokens", 0) - intruct_usage.get("output_tokens", 0)
368
+ agent_input_tokens = usage_totals["input_tokens"] - vision_usage.get("input_tokens", 0) - instruct_usage.get("input_tokens", 0)
369
+ agent_output_tokens = usage_totals["output_tokens"] - vision_usage.get("output_tokens", 0) - instruct_usage.get("output_tokens", 0)
371
370
 
372
371
  if a_in_price > 0 or a_out_price > 0:
373
372
  agent_cost = (max(0, agent_input_tokens) / 1_000_000 * a_in_price) + (max(0, agent_output_tokens) / 1_000_000 * a_out_price)
@@ -436,14 +435,14 @@ class ProcessingPipeline:
436
435
  "cost": v.get("cost", 0.0)
437
436
  })
438
437
 
439
- if trace.get("intruct"):
440
- i = trace["intruct"]
438
+ if trace.get("instruct"):
439
+ i = trace["instruct"]
441
440
  i_model = i.get("model", "")
442
441
  i_base_url = i.get("base_url", "") or self.config.base_url
443
442
  stages_used.append({
444
443
  "name": "Instruct",
445
444
  "model": i_model,
446
- "icon_config": getattr(self.config, "instruct_icon", None) or getattr(self.config, "intruct_icon", None) or infer_icon(i_model, i_base_url),
445
+ "icon_config": getattr(self.config, "instruct_icon", None) or infer_icon(i_model, i_base_url),
447
446
  "provider": infer_provider(i_base_url),
448
447
  "time": i.get("time", 0),
449
448
  "cost": i.get("cost", 0.0)
@@ -460,9 +459,9 @@ class ProcessingPipeline:
460
459
  })
461
460
 
462
461
  # Add Crawler stage if Instruct used crawl_page
463
- if trace.get("intruct"):
464
- intruct_tool_calls = trace["intruct"].get("tool_calls", [])
465
- crawl_calls = [tc for tc in intruct_tool_calls if tc.get("name") == "crawl_page"]
462
+ if trace.get("instruct"):
463
+ instruct_tool_calls = trace["instruct"].get("tool_calls", [])
464
+ crawl_calls = [tc for tc in instruct_tool_calls if tc.get("name") == "crawl_page"]
466
465
  if crawl_calls:
467
466
  # Build crawled_pages list for UI
468
467
  crawled_pages = []
@@ -828,10 +827,10 @@ class ProcessingPipeline:
828
827
  return f"Unknown tool {name}"
829
828
 
830
829
 
831
- async def _safe_llm_call(self, messages, model, tools=None, tool_choice=None, client: Optional[AsyncOpenAI] = None):
830
+ async def _safe_llm_call(self, messages, model, tools=None, tool_choice=None, client: Optional[AsyncOpenAI] = None, extra_body: Optional[Dict[str, Any]] = None):
832
831
  try:
833
832
  return await asyncio.wait_for(
834
- self._do_llm_request(messages, model, tools, tool_choice, client=client or self.client),
833
+ self._do_llm_request(messages, model, tools, tool_choice, client=client or self.client, extra_body=extra_body),
835
834
  timeout=120.0,
836
835
  )
837
836
  except asyncio.TimeoutError:
@@ -841,7 +840,7 @@ class ProcessingPipeline:
841
840
  logger.error(f"LLM Call Failed: {e}")
842
841
  return type("obj", (object,), {"content": f"Error: Model failure ({e})", "tool_calls": None})(), {"input_tokens": 0, "output_tokens": 0}
843
842
 
844
- async def _do_llm_request(self, messages, model, tools, tool_choice, client: AsyncOpenAI):
843
+ async def _do_llm_request(self, messages, model, tools, tool_choice, client: AsyncOpenAI, extra_body: Optional[Dict[str, Any]] = None):
845
844
  try:
846
845
  payload_debug = json.dumps(messages)
847
846
  logger.info(f"LLM Request Payload Size: {len(payload_debug)} chars")
@@ -856,6 +855,7 @@ class ProcessingPipeline:
856
855
  tools=tools,
857
856
  tool_choice=tool_choice,
858
857
  temperature=self.config.temperature,
858
+ extra_body=extra_body,
859
859
  )
860
860
  logger.info(f"LLM Request RECEIVED after {time.time() - t0:.2f}s")
861
861
 
@@ -880,6 +880,7 @@ class ProcessingPipeline:
880
880
  messages=[{"role": "system", "content": prompt}, {"role": "user", "content": content_payload}],
881
881
  model=model,
882
882
  client=client,
883
+ extra_body=getattr(self.config, "vision_extra_body", None),
883
884
  )
884
885
  return (response.content or "").strip(), usage
885
886
 
@@ -891,15 +892,14 @@ class ProcessingPipeline:
891
892
  tools = [self.web_search_tool, self.image_search_tool, self.set_mode_tool, self.crawl_page_tool]
892
893
  tools_desc = "- internal_web_search: 搜索文本\n- internal_image_search: 搜索图片\n- crawl_page: 获取网页内容\n- set_mode: 设定standard/agent模式"
893
894
 
894
- prompt_tpl = getattr(self.config, "intruct_system_prompt", None) or INTRUCT_SP
895
- prompt = prompt_tpl.format(user_msgs=user_input or "", tools_desc=tools_desc)
895
+ prompt = INSTRUCT_SP.format(user_msgs=user_input or "", tools_desc=tools_desc)
896
896
 
897
897
  if vision_text:
898
- prompt = f"{prompt}\\n\\n{INTRUCT_SP_VISION_ADD.format(vision_msgs=vision_text)}"
898
+ prompt = f"{prompt}\\n\\n{INSTRUCT_SP_VISION_ADD.format(vision_msgs=vision_text)}"
899
899
 
900
900
  client = self._client_for(
901
- api_key=getattr(self.config, "intruct_api_key", None),
902
- base_url=getattr(self.config, "intruct_base_url", None),
901
+ api_key=getattr(self.config, "instruct_api_key", None),
902
+ base_url=getattr(self.config, "instruct_base_url", None),
903
903
  )
904
904
 
905
905
  history: List[Dict[str, Any]] = [
@@ -913,12 +913,13 @@ class ProcessingPipeline:
913
913
  tools=tools,
914
914
  tool_choice="auto",
915
915
  client=client,
916
+ extra_body=getattr(self.config, "instruct_extra_body", None),
916
917
  )
917
918
 
918
919
  search_payloads: List[str] = []
919
- intruct_trace: Dict[str, Any] = {
920
+ instruct_trace: Dict[str, Any] = {
920
921
  "model": model,
921
- "base_url": getattr(self.config, "intruct_base_url", None) or self.config.base_url,
922
+ "base_url": getattr(self.config, "instruct_base_url", None) or self.config.base_url,
922
923
  "prompt": prompt,
923
924
  "user_input": user_input or "",
924
925
  "vision_add": vision_text or "",
@@ -946,8 +947,8 @@ class ProcessingPipeline:
946
947
  history.append(
947
948
  {"tool_call_id": tc.id, "role": "tool", "name": tc.function.name, "content": str(result)}
948
949
  )
949
- intruct_trace["tool_calls"].append(self._tool_call_to_trace(tc))
950
- intruct_trace["tool_results"].append({"name": tc.function.name, "content": str(result)})
950
+ instruct_trace["tool_calls"].append(self._tool_call_to_trace(tc))
951
+ instruct_trace["tool_results"].append({"name": tc.function.name, "content": str(result)})
951
952
 
952
953
  if tc.function.name in ["web_search", "internal_web_search"]:
953
954
  search_payloads.append(str(result))
@@ -959,18 +960,18 @@ class ProcessingPipeline:
959
960
  mode = args.get("mode", mode)
960
961
  mode_reason = args.get("reason", "")
961
962
 
962
- intruct_trace["mode"] = mode
963
+ instruct_trace["mode"] = mode
963
964
  if mode_reason:
964
- intruct_trace["mode_reason"] = mode_reason
965
+ instruct_trace["mode_reason"] = mode_reason
965
966
 
966
- intruct_trace["output"] = ""
967
- intruct_trace["usage"] = usage
968
- return "", search_payloads, intruct_trace, usage, search_time
967
+ instruct_trace["output"] = ""
968
+ instruct_trace["usage"] = usage
969
+ return "", search_payloads, instruct_trace, usage, search_time
969
970
 
970
- intruct_trace["mode"] = mode
971
- intruct_trace["output"] = (response.content or "").strip()
972
- intruct_trace["usage"] = usage
973
- return "", search_payloads, intruct_trace, usage, 0.0
971
+ instruct_trace["mode"] = mode
972
+ instruct_trace["output"] = (response.content or "").strip()
973
+ instruct_trace["usage"] = usage
974
+ return "", search_payloads, instruct_trace, usage, 0.0
974
975
 
975
976
  def _format_search_msgs(self) -> str:
976
977
  """Format search snippets only (not crawled pages)."""
@@ -1050,9 +1051,9 @@ class ProcessingPipeline:
1050
1051
  parts.append(fence("text", v.get("output", "")))
1051
1052
  parts.append("")
1052
1053
 
1053
- if trace.get("intruct"):
1054
- t = trace["intruct"]
1055
- parts.append("## Intruct\n")
1054
+ if trace.get("instruct"):
1055
+ t = trace["instruct"]
1056
+ parts.append("## Instruct\n")
1056
1057
  parts.append(f"- model: `{t.get('model')}`")
1057
1058
  parts.append(f"- base_url: `{t.get('base_url')}`\n")
1058
1059
  parts.append("### Prompt\n")
@@ -1,121 +1,121 @@
1
- VISION_SP = """# 你是一个专业的视觉转文字专家.
1
+ VISION_SP = """# You are a professional vision-to-text expert.
2
2
 
3
- # 核心任务
4
- - 智能分析图片内容, 转述成文本, 除此之外不要添加任何内容
5
- - 文字优先: 若包含清晰文字(文档、截图等), 必须完整准确转录, 不要遗漏.
6
- - 视觉补充: 解释完文字后, 描述视觉内容总结(物体、场景、氛围).
7
- - 用户要求: 根据用户消息中提示侧重转文本的偏向, 若无关联则不理会.
3
+ # Core Tasks
4
+ - Intelligently analyze image content and paraphrase it into text. Do not add any other content.
5
+ - Text Priority: If there is clear text (documents, screenshots, etc.), it must be transcribed completely and accurately, without omission.
6
+ - Visual Supplement: After explaining the text, describe the visual content summary (objects, scenes, atmosphere).
7
+ - User Requirements: Focus on text transcription based on the hint in the user message, ignore if irrelevant.
8
8
 
9
- ## 用户消息
9
+ ## User Message
10
10
  ```text
11
11
  {user_msgs}
12
12
  ```
13
13
  """
14
14
 
15
- INTRUCT_SP = """# 你是一个专业的指导专家.
16
-
17
- ## 核心任务
18
- - 决定预处理工具:
19
- - 用户消息包含链接: 调用 crawl_page 获取内容, 无需其他工具
20
- - 用户消息包含典型名词、可能的专有名词组合: 调用 internal_web_search
21
- - 提炼出关键词搜索关键词本身, 不添加任何其他助词, 搜索效果最好
22
- - 如果用户消息关键词清晰, 使用图片搜索能搜索出诸如海报、地标、物品、角色立绘等, 调用 internal_image_search
23
- - 用户消息不需要搜索: 不调用工具
24
- - 调用 set_mode:
25
- - 绝大部分常规问题: standard
26
- - 用户要求研究/深度搜索: agent
27
- - 需要获取页面具体信息才能回答问题: agent
28
- > 所有工具需要在本次对话同时调用
29
-
30
- ## 调用工具
31
- - 使用工具时, 必须通过 function_call / tool_call 机制调用.
15
+ INSTRUCT_SP = """# You are a professional instruction expert.
16
+
17
+ ## Core Tasks
18
+ - Decide on preprocessing tools:
19
+ - User message contains a link: Call `crawl_page` to get content, no other tools needed.
20
+ - User message contains typical nouns or possible proper noun combinations: Call `internal_web_search`.
21
+ - Extract keywords to search for the keywords themselves, do not add any other particles, for best search results.
22
+ - If user message keywords are clear, and image search can find posters, landmarks, items, character drawings, etc., call `internal_image_search`.
23
+ - User message does not need search: Do not call tools.
24
+ - Call `set_mode`:
25
+ - Most routine questions: `standard`.
26
+ - User requests research / deep search: `agent`.
27
+ - Need to get specific page information to answer the question: `agent`.
28
+ > All tools need to be called simultaneously in this conversation.
29
+
30
+ ## Call Tools
31
+ - When using tools, you must call them via the `function_call` / `tool_call` mechanism.
32
32
  {tools_desc}
33
33
 
34
- ## 你的回复
35
- 调用工具后无需回复额外文本节省token.
34
+ ## Your Reply
35
+ Do not reply with extra text after calling tools to save tokens.
36
36
 
37
- ## 用户消息
37
+ ## User Message
38
38
  ```
39
39
  {user_msgs}
40
40
  ```
41
41
  """
42
42
 
43
43
 
44
- INTRUCT_SP_VISION_ADD = """
45
- ## 视觉专家消息
44
+ INSTRUCT_SP_VISION_ADD = """
45
+ ## Vision Expert Message
46
46
  ```text
47
47
  {vision_msgs}
48
48
  ```
49
49
  """
50
50
 
51
- AGENT_SP = """# 你是一个 Agent 总控专家, 你需要理解用户意图, 根据已有信息给出最终回复.
52
- > 请确保你输出的任何消息有着准确的来源, 减少输出错误信息.
53
-
54
- 当前模式: {mode}, {mode_desc}
55
-
56
-
57
-
58
- ## 过程要求
59
- 当不调用工具发送文本, 即会变成最终回复, 请遵守:
60
- - 直接给出一篇报告, 无需回答用户消息
61
- - 语言: 简体中文, 百科式风格, 语言严谨不啰嗦.
62
- - 正文格式:
63
- - 使用 Markdown 格式, 支持 hightlight, katex
64
- - 最开始给出`# `大标题, 不要有多余废话, 不要直接回答用户的提问.
65
- - 内容丰富突出重点.
66
- - 工具引用:
67
- > 重要: 所有正文内容必须基于实际信息, 保证百分百真实度
68
- - 引用规则:
69
- - 本次会话中存在对解决此问题有用的信息才加以引用, 不需要的消息可以不引用.
70
- - 角标必须真实对应上下文中获取的信息, 同时对应 references 中的内容, 图片按顺序对应.
71
- - 正文中的引用规则
72
- - 搜索摘要引用: 使用如 [search:3][search:4]
73
- - 页面内容引用: 使用如 [page:5][page:6]
74
- - 图片引用: 使用如 [image:7][image:8]
75
- - search 的意思是你使用 internal_web_search 获取的搜索摘要, 如果没有此工具相关信息则不引用
76
- - page 的意思是你使用 crawl_page 获取的页面内容, 如果没有此工具相关信息则不引用
77
- - image 的意思是你使用 internal_image_search 获取的图片, 图片按顺序摆放即可, 你无需显式引用
78
- - 在正文底部添加 references 代码块:
79
- - 用不到的条目不写, 没有专家给信息就不写.
51
+ AGENT_SP = """# You are an Agent Control Expert. You need to understand user intent and provide a final reply based on available information.
52
+ > Please ensure that any message you output has an accurate source to reduce misinformation.
53
+
54
+ Current Mode: {mode}, {mode_desc}
55
+
56
+
57
+
58
+ ## Process Requirements
59
+ When sending text without calling tools, it means this is the final reply. Please observe:
60
+ - Provide a report directly, no need to explicitly answer the user message.
61
+ - Language: {language}, encyclopedic style, rigorous and concise language.
62
+ - Body Format:
63
+ - Use Markdown format, supporting highlight, katex.
64
+ - Give a `# ` main title at the beginning, no extra nonsense, do not directly answer the user's question.
65
+ - Rich content highlighting key points.
66
+ - Tool Citation:
67
+ > Important: All body content must be based on actual information, ensuring 100% accuracy.
68
+ - Citation Rules:
69
+ - Cite information only if it is useful for solving the problem in this session; do not cite unnecessary messages.
70
+ - Badges must truly correspond to the information obtained in the context, and correspond to the content in references. Images correspond in order.
71
+ - Citation Rules in Body:
72
+ - Search Summary Citation: Use like `[search:3][search:4]`
73
+ - Page Content Citation: Use like `[page:5][page:6]`
74
+ - Image Citation: Use like `[image:7][image:8]`
75
+ - `search` means search summaries obtained using `internal_web_search`. Do not cite if no relevant info from this tool.
76
+ - `page` means page content obtained using `crawl_page`. Do not cite if no relevant info from this tool.
77
+ - `image` means images obtained using `internal_image_search`. Just place images in order, you do not need to explicitly cite.
78
+ - Add a `references` code block at the bottom of the body:
79
+ - Do not write unused entries. Do not write if experts gave no info.
80
80
  ```references
81
- [2] [search] [文本描述](url)
82
- [8] [search] [文本描述](url)
83
- [1] [page] [页面标题](url)
84
- [2] [page] [页面标题](url)
85
- [1] [image] [来源](url)
81
+ [2] [search] [Text Description](url)
82
+ [8] [search] [Text Description](url)
83
+ [1] [page] [Page Title](url)
84
+ [2] [page] [Page Title](url)
85
+ [1] [image] [Source](url)
86
86
  ```
87
87
 
88
- ## 用户消息
88
+ ## User Message
89
89
  ```text
90
90
  {user_msgs}
91
91
  ```
92
92
  """
93
93
 
94
94
  AGENT_SP_TOOLS_STANDARD_ADD = """
95
- 你需要整合已有的信息, 提炼用户消息中的关键词, 进行最终回复.
95
+ You need to integrate existing information, extract keywords from the user message, and make a final reply.
96
96
  """
97
97
 
98
98
 
99
99
  AGENT_SP_TOOLS_AGENT_ADD = """
100
- - 你现在可以使用工具: {tools_desc}
101
- - 你需要判断顺序或并发使用工具获取信息:
102
- - 0-1 internal_web_search
103
- - 0-1 internal_image_search (如果用户需要图片, 通常和 internal_web_search 并发执行)
104
- - 1-2 crawl_page
105
- - 使用工具时, 必须通过 function_call / tool_call 机制调用.
100
+ - You can now use tools: {tools_desc}
101
+ - You need to judge whether to use tools sequentially or concurrently to obtain information:
102
+ - 0-1 times `internal_web_search`
103
+ - 0-1 times `internal_image_search` (if user needs images, usually concurrent with `internal_web_search`)
104
+ - 1-2 times `crawl_page`
105
+ - When using tools, you must call them via the `function_call` / `tool_call` mechanism.
106
106
  """
107
107
 
108
108
 
109
109
 
110
- AGENT_SP_INTRUCT_VISION_ADD = """
111
- ## 视觉专家消息
110
+ AGENT_SP_INSTRUCT_VISION_ADD = """
111
+ ## Vision Expert Message
112
112
  ```text
113
113
  {vision_msgs}
114
114
  ```
115
115
  """
116
116
 
117
117
  AGENT_SP_SEARCH_ADD = """
118
- ## 搜索专家消息
118
+ ## Search Expert Message
119
119
  ```text
120
120
  {search_msgs}
121
121
  ```
@@ -124,17 +124,17 @@ AGENT_SP_SEARCH_ADD = """
124
124
  """
125
125
 
126
126
  AGENT_SP_PAGE_ADD = """
127
- ## 页面内容专家消息
127
+ ## Page Content Expert Message
128
128
  ```text
129
129
  {page_msgs}
130
130
  ```
131
- - 引用页面内容时, 必须使用 `page:id` 格式
131
+ - When citing page content, you must use the `page:id` format.
132
132
  """
133
133
 
134
134
  AGENT_SP_IMAGE_SEARCH_ADD = """
135
- ## 图像搜索专家消息
135
+ ## Image Search Expert Message
136
136
  ```text
137
137
  {image_search_msgs}
138
138
  ```
139
- - 每进行一次 internal_image_search, 挑选 1 张图像插入正文
139
+ - For every `internal_image_search` performed, pick 1 image to insert into the body.
140
140
  """
@@ -0,0 +1,140 @@
1
+ VISION_SP = """# 你是一个专业的视觉转文字专家.
2
+
3
+ # 核心任务
4
+ - 智能分析图片内容, 转述成文本, 除此之外不要添加任何内容
5
+ - 文字优先: 若包含清晰文字(文档、截图等), 必须完整准确转录, 不要遗漏.
6
+ - 视觉补充: 解释完文字后, 描述视觉内容总结(物体、场景、氛围).
7
+ - 用户要求: 根据用户消息中提示侧重转文本的偏向, 若无关联则不理会.
8
+
9
+ ## 用户消息
10
+ ```text
11
+ {user_msgs}
12
+ ```
13
+ """
14
+
15
+ INSTRUCT_SP = """# 你是一个专业的指导专家.
16
+
17
+ ## 核心任务
18
+ - 决定预处理工具:
19
+ - 用户消息包含链接: 调用 crawl_page 获取内容, 无需其他工具
20
+ - 用户消息包含典型名词、可能的专有名词组合: 调用 internal_web_search
21
+ - 提炼出关键词搜索关键词本身, 不添加任何其他助词, 搜索效果最好
22
+ - 如果用户消息关键词清晰, 使用图片搜索能搜索出诸如海报、地标、物品、角色立绘等, 调用 internal_image_search
23
+ - 用户消息不需要搜索: 不调用工具
24
+ - 调用 set_mode:
25
+ - 绝大部分常规问题: standard
26
+ - 用户要求研究/深度搜索: agent
27
+ - 需要获取页面具体信息才能回答问题: agent
28
+ > 所有工具需要在本次对话同时调用
29
+
30
+ ## 调用工具
31
+ - 使用工具时, 必须通过 function_call / tool_call 机制调用.
32
+ {tools_desc}
33
+
34
+ ## 你的回复
35
+ 调用工具后无需回复额外文本节省token.
36
+
37
+ ## 用户消息
38
+ ```
39
+ {user_msgs}
40
+ ```
41
+ """
42
+
43
+
44
+ INSTRUCT_SP_VISION_ADD = """
45
+ ## 视觉专家消息
46
+ ```text
47
+ {vision_msgs}
48
+ ```
49
+ """
50
+
51
+ AGENT_SP = """# 你是一个 Agent 总控专家, 你需要理解用户意图, 根据已有信息给出最终回复.
52
+ > 请确保你输出的任何消息有着准确的来源, 减少输出错误信息.
53
+
54
+ 当前模式: {mode}, {mode_desc}
55
+
56
+
57
+
58
+ ## 过程要求
59
+ 当不调用工具发送文本, 即会变成最终回复, 请遵守:
60
+ - 直接给出一篇报告, 无需回答用户消息
61
+ - 语言: {language}, 百科式风格, 语言严谨不啰嗦.
62
+ - 正文格式:
63
+ - 使用 Markdown 格式, 支持 hightlight, katex
64
+ - 最开始给出`# `大标题, 不要有多余废话, 不要直接回答用户的提问.
65
+ - 内容丰富突出重点.
66
+ - 工具引用:
67
+ > 重要: 所有正文内容必须基于实际信息, 保证百分百真实度
68
+ - 引用规则:
69
+ - 本次会话中存在对解决此问题有用的信息才加以引用, 不需要的消息可以不引用.
70
+ - 角标必须真实对应上下文中获取的信息, 同时对应 references 中的内容, 图片按顺序对应.
71
+ - 正文中的引用规则
72
+ - 搜索摘要引用: 使用如 [search:3][search:4]
73
+ - 页面内容引用: 使用如 [page:5][page:6]
74
+ - 图片引用: 使用如 [image:7][image:8]
75
+ - search 的意思是你使用 internal_web_search 获取的搜索摘要, 如果没有此工具相关信息则不引用
76
+ - page 的意思是你使用 crawl_page 获取的页面内容, 如果没有此工具相关信息则不引用
77
+ - image 的意思是你使用 internal_image_search 获取的图片, 图片按顺序摆放即可, 你无需显式引用
78
+ - 在正文底部添加 references 代码块:
79
+ - 用不到的条目不写, 没有专家给信息就不写.
80
+ ```references
81
+ [2] [search] [文本描述](url)
82
+ [8] [search] [文本描述](url)
83
+ [1] [page] [页面标题](url)
84
+ [2] [page] [页面标题](url)
85
+ [1] [image] [来源](url)
86
+ ```
87
+
88
+ ## 用户消息
89
+ ```text
90
+ {user_msgs}
91
+ ```
92
+ """
93
+
94
+ AGENT_SP_TOOLS_STANDARD_ADD = """
95
+ 你需要整合已有的信息, 提炼用户消息中的关键词, 进行最终回复.
96
+ """
97
+
98
+
99
+ AGENT_SP_TOOLS_AGENT_ADD = """
100
+ - 你现在可以使用工具: {tools_desc}
101
+ - 你需要判断顺序或并发使用工具获取信息:
102
+ - 0-1 次 internal_web_search
103
+ - 0-1 次 internal_image_search (如果用户需要图片, 通常和 internal_web_search 并发执行)
104
+ - 1-2 次 crawl_page
105
+ - 使用工具时, 必须通过 function_call / tool_call 机制调用.
106
+ """
107
+
108
+
109
+
110
+ AGENT_SP_INSTRUCT_VISION_ADD = """
111
+ ## 视觉专家消息
112
+ ```text
113
+ {vision_msgs}
114
+ ```
115
+ """
116
+
117
+ AGENT_SP_SEARCH_ADD = """
118
+ ## 搜索专家消息
119
+ ```text
120
+ {search_msgs}
121
+ ```
122
+
123
+
124
+ """
125
+
126
+ AGENT_SP_PAGE_ADD = """
127
+ ## 页面内容专家消息
128
+ ```text
129
+ {page_msgs}
130
+ ```
131
+ - 引用页面内容时, 必须使用 `page:id` 格式
132
+ """
133
+
134
+ AGENT_SP_IMAGE_SEARCH_ADD = """
135
+ ## 图像搜索专家消息
136
+ ```text
137
+ {image_search_msgs}
138
+ ```
139
+ - 每进行一次 internal_image_search, 挑选 1 张图像插入正文
140
+ """
@@ -0,0 +1,113 @@
1
+ Metadata-Version: 2.4
2
+ Name: entari_plugin_hyw
3
+ Version: 3.3.8
4
+ Summary: Use large language models to interpret chat messages
5
+ Author-email: kumoSleeping <zjr2992@outlook.com>
6
+ License: MIT
7
+ Project-URL: Homepage, https://github.com/kumoSleeping/entari-plugin-hyw
8
+ Project-URL: Repository, https://github.com/kumoSleeping/entari-plugin-hyw
9
+ Project-URL: Issue Tracker, https://github.com/kumoSleeping/entari-plugin-hyw/issues
10
+ Keywords: entari,llm,ai,bot,chat
11
+ Classifier: Development Status :: 3 - Alpha
12
+ Classifier: Intended Audience :: Developers
13
+ Classifier: License :: OSI Approved :: MIT License
14
+ Classifier: Programming Language :: Python :: 3.10
15
+ Classifier: Programming Language :: Python :: 3.11
16
+ Classifier: Programming Language :: Python :: 3.12
17
+ Requires-Python: >=3.10
18
+ Description-Content-Type: text/markdown
19
+ Requires-Dist: arclet-entari[full]>=0.16.5
20
+ Requires-Dist: openai
21
+ Requires-Dist: httpx
22
+ Requires-Dist: markdown>=3.10
23
+ Requires-Dist: crawl4ai>=0.7.8
24
+ Requires-Dist: jinja2>=3.0
25
+ Requires-Dist: ddgs>=9.10.0
26
+ Provides-Extra: dev
27
+ Requires-Dist: entari-plugin-server>=0.5.0; extra == "dev"
28
+ Requires-Dist: satori-python-adapter-onebot11>=0.2.5; extra == "dev"
29
+
30
+ # Entari Plugin HYW
31
+
32
+ [![PyPI version](https://badge.fury.io/py/entari-plugin-hyw.svg)](https://badge.fury.io/py/entari-plugin-hyw)
33
+ [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
34
+ [![Python Versions](https://img.shields.io/pypi/pyversions/entari-plugin-hyw.svg)](https://pypi.org/project/entari-plugin-hyw/)
35
+
36
+ **English** | [简体中文](docs/README_CN.md)
37
+
38
+ **Entari Plugin HYW** is an advanced agentic chat plugin for the [Entari](https://github.com/entari-org/entari) framework. It leverages Large Language Models (LLMs) to provide intelligent, context-aware, and multi-modal responses within instant messaging environments (OneBot 11, Satori).
39
+
40
+ The plugin implements a three-stage pipeline (**Vision**, **Instruct**, **Agent**) to autonomously decide when to search the web, crawl pages, or analyze images to answer user queries effectively.
41
+
42
+ <p align="center">
43
+ <img src="docs/demo_mockup.svg" width="800" />
44
+ </p>
45
+
46
+ ## Features
47
+
48
+ - 📖 **Agentic Workflow**
49
+ Autonomous decision-making process to search, browse, and reason.
50
+
51
+ - 🎑 **Multi-Modal Support**
52
+ Native support for image analysis using Vision Language Models (VLMs).
53
+
54
+ - 🔍 **Web Search & Crawling**
55
+ Integrated **DuckDuckGo** and **Crawl4AI** for real-time information retrieval.
56
+
57
+ - 🎨 **Rich Rendering**
58
+ Responses are rendered as images containing Markdown, syntax-highlighted code, LaTeX math, and citation badges.
59
+
60
+ - 🔌 **Protocol Support**
61
+ Deep integration with OneBot 11 and Satori protocols, handling reply context and JSON cards perfectly.
62
+
63
+ ## Installation
64
+
65
+ ```bash
66
+ pip install entari-plugin-hyw
67
+ ```
68
+
69
+ ## Configuration
70
+
71
+ Configure the plugin in your `entari.yml`.
72
+
73
+ ### Minimal Configuration
74
+
75
+ ```yaml
76
+ plugins:
77
+ entari_plugin_hyw:
78
+ model_name: google/gemini-3-flash-preview
79
+ api_key: "your-or-api-key-here"
80
+ ```
81
+
82
+ ## Usage
83
+
84
+ ### Commands
85
+
86
+ - **Text Query**
87
+ ```text
88
+ /q What's the latest news on Rust 1.83?
89
+ ```
90
+
91
+ - **Image Analysis**
92
+ *(Send an image with command, or reply to an image)*
93
+ ```text
94
+ /q [Image] Explain this error.
95
+ ```
96
+ - **Quote Query**
97
+ ```text
98
+ [quote: User Message] /q
99
+ ```
100
+
101
+ - **Follow-up**
102
+ *Reply to the bot's message to continue the conversation.*
103
+
104
+ ## Documentation for AI/LLMs
105
+
106
+ - [Instruction Guide (English)](docs/README_LLM_EN.md)
107
+ - [指导手册 (简体中文)](docs/README_LLM_CN.md)
108
+
109
+ ---
110
+
111
+ ## License
112
+
113
+ This project is licensed under the MIT License.
@@ -1,4 +1,4 @@
1
- entari_plugin_hyw/__init__.py,sha256=K5WW4usKpP38CTxQHpm693brIhsbxBRsD0ojwekmMGE,19689
1
+ entari_plugin_hyw/__init__.py,sha256=BwlY42IJj51Oo8hHrTxbCDItRA3bMr7Z1G-3HUEyWhQ,19708
2
2
  entari_plugin_hyw/assets/package-lock.json,sha256=TIrLM-wLWZTrp3LKfzhEVuduhvBJmI93NdQEKYLW2W0,33172
3
3
  entari_plugin_hyw/assets/package.json,sha256=Y4H8JGtp3nv2WUtI20tXoXWddR-dwwKJhqQVLercpiw,306
4
4
  entari_plugin_hyw/assets/tailwind.config.js,sha256=S8I9X8hI8IaQRczWK9hTW-zl4oVpAXw5ykeksrzHjpU,382
@@ -11,6 +11,7 @@ entari_plugin_hyw/assets/icon/deepseek.png,sha256=KWWAr9aeYMc6I07U_1qo7zcXO6e7-k
11
11
  entari_plugin_hyw/assets/icon/gemini.svg,sha256=H74CoVmx5opcCtr3Ay3M09dpqL9cd9Whkx-M6an3t7s,599
12
12
  entari_plugin_hyw/assets/icon/google.svg,sha256=H74CoVmx5opcCtr3Ay3M09dpqL9cd9Whkx-M6an3t7s,599
13
13
  entari_plugin_hyw/assets/icon/grok.png,sha256=uSulvvDVqoA4RUOW0ZAkdvBVM2rpyGJRZIbn5dEFspw,362
14
+ entari_plugin_hyw/assets/icon/huggingface.png,sha256=8eAudeftUDO11jf0coOscPeRkskCb7l9TNMx78q61mY,24564
14
15
  entari_plugin_hyw/assets/icon/microsoft.svg,sha256=-am_6N3UEQYSzldDg-xrdGYjTWsagH-3v4Q_eia1ymE,684
15
16
  entari_plugin_hyw/assets/icon/minimax.png,sha256=tWqVlMdFNPpP8zWWX9tvIsWXI9q76P7O3t3CEZO7NU0,1525
16
17
  entari_plugin_hyw/assets/icon/mistral.png,sha256=0vv7jPmPKiBRYVYYJxVL_wIH_qa_ZssIdV3NDO5vbmk,869
@@ -20,6 +21,7 @@ entari_plugin_hyw/assets/icon/openrouter.png,sha256=exxfjWGDWpYH-Vc8xJDbhNVeXFEV
20
21
  entari_plugin_hyw/assets/icon/perplexity.svg,sha256=mHWZFoeWmDYXOIDzm9pj6_sRotaI8xNy5Lkeg5Vzu70,555
21
22
  entari_plugin_hyw/assets/icon/qwen.png,sha256=eqLbnIPbjh2_PsODU_mmqjeD82xXj8fV_kN0fDrNaD0,38419
22
23
  entari_plugin_hyw/assets/icon/xai.png,sha256=uSulvvDVqoA4RUOW0ZAkdvBVM2rpyGJRZIbn5dEFspw,362
24
+ entari_plugin_hyw/assets/icon/xiaomi.png,sha256=WHxlDFGU5FCjb-ure3ngdGG18-efYZUUfqA3_lqCUN0,4084
23
25
  entari_plugin_hyw/assets/icon/zai.png,sha256=K-gnabdsjMLInppHA1Op7Nyt33iegrx1x-yNlvCZ0Tc,2351
24
26
  entari_plugin_hyw/assets/libs/highlight.css,sha256=Oppd74ucMR5a5Dq96FxjEzGF7tTw2fZ_6ksAqDCM8GY,1309
25
27
  entari_plugin_hyw/assets/libs/highlight.js,sha256=g3pvpbDHNrUrveKythkPMF2j_J7UFoHbUyFQcFe1yEY,121727
@@ -28,18 +30,19 @@ entari_plugin_hyw/assets/libs/katex.css,sha256=UF1fgpAiu3tPJN_uCqEUHNe7pnr-QR0SQ
28
30
  entari_plugin_hyw/assets/libs/katex.js,sha256=3ISyluw-iE3gkxWPdg_Z1Ftser5YtTgVV_ThOPRqWK4,277038
29
31
  entari_plugin_hyw/assets/libs/tailwind.css,sha256=ee_3txpnxhChZOjSJQUX0XiL1Nq0U2KLTvSGJLZBlaA,19916
30
32
  entari_plugin_hyw/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
31
- entari_plugin_hyw/core/config.py,sha256=rN2hVI964D7eM6xPuOthEIpXyFGZpRSYNrl1xdKHJ1s,1636
33
+ entari_plugin_hyw/core/config.py,sha256=uKZOuK9bG1W-E5UzhKX-EcYu2nFdxfl9EEaSwVgFtK4,1653
32
34
  entari_plugin_hyw/core/history.py,sha256=vqp7itwR5-KaqC4Ftmq6GOz7OM9GsiFJnSN9JJ2P6L4,5894
33
35
  entari_plugin_hyw/core/hyw.py,sha256=RCRjV9uYmvXysiliztphLP3VyUabrf0LY2Bk66W5JGA,1927
34
- entari_plugin_hyw/core/pipeline.py,sha256=t1nIjQlMKqTb7wpY7Dn1rbWDD2kl8WWUnPQBY5MQO4E,49071
36
+ entari_plugin_hyw/core/pipeline.py,sha256=6fA59ObZSV7Cb0mluOumpXve0m0WFGFgAopHVRgbah4,49197
35
37
  entari_plugin_hyw/core/render.py,sha256=rUhv2R5fdtsMIGg-Q1qe8hhUWC1_E50BODLA78u4_SI,28948
36
38
  entari_plugin_hyw/utils/__init__.py,sha256=TnkxDqYr0zgRE7TC92tVbUaY8m1UyyoLg2zvzQ8nMVI,84
37
39
  entari_plugin_hyw/utils/browser.py,sha256=LJlFh-oSqt9mQBpMALxbYGUG__t1YLUo7RxUAslsWUc,1416
38
40
  entari_plugin_hyw/utils/misc.py,sha256=_7iHVYj_mJ6OGq6FU1s_cFeS1Ao-neBjZYd6eI2p95U,3482
39
41
  entari_plugin_hyw/utils/playwright_tool.py,sha256=ZZNkzFtUt_Gxny3Od4boBAgNF9J0N84uySatzn1Bwe4,1272
40
- entari_plugin_hyw/utils/prompts.py,sha256=oJpgNvRQ_Lmr2Ca-B6fcpysMT2i0obioBC1DuH_Z1MY,4430
42
+ entari_plugin_hyw/utils/prompts.py,sha256=eybCtSuW4F13jQtleHXF6CQypCIIutDT7mpbkXS48Gs,4993
43
+ entari_plugin_hyw/utils/prompts_cn.py,sha256=87ti20ofjc8QW3i8HaPCUpDfl0EsS-ynz78e4tCz4Cg,4431
41
44
  entari_plugin_hyw/utils/search.py,sha256=Bvz2KFw3Gr2nuvmlo_8ExLHvO353NKX-YN35A2FCsBw,19047
42
- entari_plugin_hyw-3.3.7.dist-info/METADATA,sha256=ZQ_HfsEQKXUPkEf2KaPSO9hPm1bYgHSfCo-GRV-f9l8,6340
43
- entari_plugin_hyw-3.3.7.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
44
- entari_plugin_hyw-3.3.7.dist-info/top_level.txt,sha256=TIDsn6XPs6KA5e3ezsE65JoXsy03ejDdrB41I4SPjmo,18
45
- entari_plugin_hyw-3.3.7.dist-info/RECORD,,
45
+ entari_plugin_hyw-3.3.8.dist-info/METADATA,sha256=a6rO4NRoNrbOG3MjRbFeCxCuYkm8OoIYpAaibPxszgM,3598
46
+ entari_plugin_hyw-3.3.8.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
47
+ entari_plugin_hyw-3.3.8.dist-info/top_level.txt,sha256=TIDsn6XPs6KA5e3ezsE65JoXsy03ejDdrB41I4SPjmo,18
48
+ entari_plugin_hyw-3.3.8.dist-info/RECORD,,
@@ -1,142 +0,0 @@
1
- Metadata-Version: 2.4
2
- Name: entari_plugin_hyw
3
- Version: 3.3.7
4
- Summary: Use large language models to interpret chat messages
5
- Author-email: kumoSleeping <zjr2992@outlook.com>
6
- License: MIT
7
- Project-URL: Homepage, https://github.com/kumoSleeping/entari-plugin-hyw
8
- Project-URL: Repository, https://github.com/kumoSleeping/entari-plugin-hyw
9
- Project-URL: Issue Tracker, https://github.com/kumoSleeping/entari-plugin-hyw/issues
10
- Keywords: entari,llm,ai,bot,chat
11
- Classifier: Development Status :: 3 - Alpha
12
- Classifier: Intended Audience :: Developers
13
- Classifier: License :: OSI Approved :: MIT License
14
- Classifier: Programming Language :: Python :: 3.10
15
- Classifier: Programming Language :: Python :: 3.11
16
- Classifier: Programming Language :: Python :: 3.12
17
- Requires-Python: >=3.10
18
- Description-Content-Type: text/markdown
19
- Requires-Dist: arclet-entari[full]>=0.16.5
20
- Requires-Dist: openai
21
- Requires-Dist: httpx
22
- Requires-Dist: markdown>=3.10
23
- Requires-Dist: crawl4ai>=0.7.8
24
- Requires-Dist: jinja2>=3.0
25
- Requires-Dist: ddgs>=9.10.0
26
- Provides-Extra: dev
27
- Requires-Dist: entari-plugin-server>=0.5.0; extra == "dev"
28
- Requires-Dist: satori-python-adapter-onebot11>=0.2.5; extra == "dev"
29
-
30
-
31
- # Entari Plugin HYW
32
-
33
-
34
- [![PyPI version](https://badge.fury.io/py/entari-plugin-hyw.svg)](https://badge.fury.io/py/entari-plugin-hyw)
35
- [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
36
- [![Python Versions](https://img.shields.io/pypi/pyversions/entari-plugin-hyw.svg)](https://pypi.org/project/entari-plugin-hyw/)
37
-
38
- **Entari Plugin HYW** is an advanced agentic chat plugin for the [Entari](https://github.com/entari-org/entari) framework. It leverages Large Language Models (LLMs) to provide intelligent, context-aware, and multi-modal responses within instant messaging environments (OneBot 11, Satori).
39
-
40
- **Entari Plugin HYW** 是 Entari 框架的高级智能体聊天插件。它利用大语言模型(LLM)在即时通讯环境(OneBot 11, Satori)中提供智能、上下文感知和多模态的回复体验。
41
-
42
- The plugin implements a three-stage pipeline (**Vision**, **Instruct**, **Agent**) to autonomously decide when to search the web, crawl pages, or analyze images to answer user queries effectively.
43
-
44
- 插件实现了三阶段流水线(**视觉**、**指令**、**代理**),能够自主决定何时搜索网络、抓取网页或分析图片,从而高效地回答用户问题。
45
-
46
- <img src="demo.jpg" width="300" />
47
-
48
- ## Features / 功能特性
49
-
50
- - 📖 **Agentic Workflow (智能工作流)**
51
- Autonomous decision-making process to search, browse, and reason.
52
- 具备自主决策能力,能够自动进行搜索、网页浏览和逻辑推理。
53
-
54
- - 🎑 **Multi-Modal Support (多模态支持)**
55
- Native support for image analysis using Vision Language Models (VLMs).
56
- 原生支持图片分析,利用视觉语言模型(VLM)理解图像内容。
57
-
58
- - 🔍 **Web Search & Crawling (搜索与抓取)**
59
- Integrated **DuckDuckGo** and **Crawl4AI** for real-time information retrieval.
60
- 集成 DuckDuckGo 搜索与 Crawl4AI 网页抓取,实时获取互联网信息。
61
-
62
- - 🎨 **Rich Rendering (富媒体渲染)**
63
- Responses are rendered as images containing Markdown, syntax-highlighted code, LaTeX math, and citation badges.
64
- 回答将渲染为包含 Markdown、代码高亮、LaTeX 公式及引用角标的精美图片。
65
-
66
- - 🔌 **Protocol Support (多协议适配)**
67
- Deep integration with OneBot 11 and Satori protocols.
68
- 深度适配 OneBot 11 和 Satori 协议,完美处理回复上下文与 JSON 卡片。
69
-
70
- ## Installation / 安装
71
-
72
- ```bash
73
- pip install entari-plugin-hyw
74
- ```
75
-
76
- ## Configuration / 配置
77
-
78
- Configure the plugin in your `entari.yml`.
79
- 在 `entari.yml` 中进行配置。
80
-
81
- ### Minimal Configuration / 最小配置
82
-
83
- ```yaml
84
- plugins:
85
- entari_plugin_hyw:
86
- # Trigger command / 触发指令
87
- question_command: ".q"
88
-
89
- # Main Model (Required) / 主模型(必需)
90
- model_name: "google/gemini-2.0-flash-exp"
91
- api_key: "your-api-key-here"
92
- base_url: "https://generativelanguage.googleapis.com/v1beta/openai/"
93
- ```
94
-
95
- ### Configuration Reference / 配置详解
96
-
97
- | Option (选项) | Type | Default | Description (说明) |
98
- | :--- | :--- | :--- | :--- |
99
- | **Basic** | | | |
100
- | `question_command` | `str` | `/q` | The command to trigger the bot. <br> 触发机器人的指令前缀。 |
101
- | `reaction` | `bool` | `true` | React with emoji on start(now only lagrange ob extension). <br> 收到指令时是否回应表情(目前只支持拉格兰ob扩展)。 |
102
- | `quote` | `bool` | `true` | Quote the user's message in reply. <br> 回复时是否引用原消息。 |
103
- | **Models** | | | |
104
- | `model_name` | `str` | *None* | **Required.** Main Agent model ID. <br> **必需。** 主代理模型 ID。 |
105
- | `api_key` | `str` | *None* | **Required.** API key. <br> **必需。** API 密钥。 |
106
- | `base_url` | `str` | `...` | OpenAI-compatible API base URL. <br> 兼容 OpenAI 的 API 地址。 |
107
- | `extra_body` | `dict` | `null` | Extra parameters (e.g. `reasoning_effort`). <br> 传递给 LLM 的额外参数。 |
108
- | **Specialized** | | | |
109
- | `vision_model_name`| `str` | *None* | Model for images. Defaults to `model_name`. <br> 处理图片的模型,默认同主模型。 |
110
- | `intruct_model_name`| `str` | *None* | Model for intent. Defaults to `model_name`. <br> 意图识别模型,默认同主模型。 |
111
- | **Tools** | | | |
112
- | `search_provider` | `str` | `ddgs`| `ddgs` (DuckDuckGo), `crawl4ai`, `httpx`. <br> 搜索后端提供商。 |
113
- | `search_limit` | `int` | `8` | Max search results. <br> 搜索结果数量限制。 |
114
- | `headless` | `bool` | `true` | Browser headless mode. <br> 浏览器无头模式。 |
115
-
116
- ## Usage / 使用方法
117
-
118
- ### Commands / 指令
119
-
120
- - **Text Query (文本问答)**
121
- ```text
122
- .q What's the latest news on Rust 1.83?
123
- .q Rust 1.83 有什么新特性?
124
- ```
125
-
126
- - **Image Analysis (图片分析)**
127
- *(Send an image with command, or reply to an image)*
128
- *(发送带图片的指令,或回复一张图片)*
129
- ```text
130
- .q [Image] Explain this error.
131
- .q [图片] 解释一下这个报错。
132
- ```
133
-
134
- - **Follow-up (追问)**
135
- *Reply to the bot's message to continue the conversation.*
136
- *直接回复机器人的消息即可进行连续对话。*
137
-
138
- -----
139
-
140
- ## License
141
-
142
- This project is licensed under the MIT License.