sophhub 0.4.19 → 0.4.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (633)
  1. package/README.md +199 -187
  2. package/agents/ai-cs-admin/.config.json +51 -51
  3. package/agents/ai-cs-admin/AGENTS.md +293 -293
  4. package/agents/ai-cs-admin/HEARTBEAT.md +18 -18
  5. package/agents/ai-cs-qa/.config.json +47 -47
  6. package/agents/ai-cs-qa/BOOTSTRAP.md +22 -22
  7. package/agents/ai-cs-qa/scripts/setup_links.sh +39 -39
  8. package/agents/beauty/.config.json +17 -17
  9. package/agents/beauty/AGENTS.md +234 -234
  10. package/agents/beauty/BOOTSTRAP.md +55 -55
  11. package/agents/beauty/HEARTBEAT.md +5 -5
  12. package/agents/beauty/IDENTITY.md +5 -5
  13. package/agents/beauty/MEMORY.md +44 -44
  14. package/agents/beauty/SOUL.md +64 -64
  15. package/agents/beauty/TOOLS.md +160 -160
  16. package/agents/beauty/USER.md +114 -114
  17. package/agents/intern-admin/.config.json +60 -60
  18. package/agents/intern-admin/AGENTS.md +267 -267
  19. package/agents/intern-admin/BOOTSTRAP.md +21 -21
  20. package/agents/intern-admin/HEARTBEAT.md +3 -3
  21. package/agents/intern-admin/IDENTITY.md +6 -6
  22. package/agents/intern-admin/MEMORY.md +21 -21
  23. package/agents/intern-admin/SOUL.md +23 -23
  24. package/agents/intern-admin/TOOLS.md +93 -93
  25. package/agents/intern-admin/USER.md +16 -16
  26. package/agents/intern-admin/scripts/init_workspace.sh +27 -27
  27. package/agents/intern-qa/.config.json +46 -46
  28. package/agents/intern-qa/AGENTS.md +303 -303
  29. package/agents/intern-qa/BOOTSTRAP.md +16 -16
  30. package/agents/intern-qa/HEARTBEAT.md +3 -3
  31. package/agents/intern-qa/IDENTITY.md +6 -6
  32. package/agents/intern-qa/MEMORY.md +22 -22
  33. package/agents/intern-qa/SOUL.md +24 -24
  34. package/agents/intern-qa/TOOLS.md +24 -24
  35. package/agents/intern-qa/USER.md +27 -27
  36. package/agents/intern-qa/scripts/setup_links.sh +54 -54
  37. package/agents/parent-toddler/.config.json +37 -37
  38. package/agents/parent-toddler/AGENTS.md +51 -51
  39. package/agents/parent-toddler/BOOTSTRAP.md +55 -55
  40. package/agents/parent-toddler/HEARTBEAT.md +5 -5
  41. package/agents/parent-toddler/IDENTITY.md +5 -5
  42. package/agents/parent-toddler/MEMORY.md +22 -22
  43. package/agents/parent-toddler/SOUL.md +35 -35
  44. package/agents/parent-toddler/TOOLS.md +31 -31
  45. package/agents/parent-toddler/USER.md +44 -44
  46. package/agents/vip-admin/.config.json +51 -51
  47. package/agents/vip-admin/AGENTS.md +314 -314
  48. package/agents/vip-admin/BOOTSTRAP.md +21 -21
  49. package/agents/vip-admin/HEARTBEAT.md +19 -19
  50. package/agents/vip-admin/IDENTITY.md +6 -6
  51. package/agents/vip-admin/MEMORY.md +30 -30
  52. package/agents/vip-admin/SOUL.md +25 -25
  53. package/agents/vip-admin/TOOLS.md +108 -108
  54. package/agents/vip-admin/USER.md +31 -31
  55. package/agents/vip-qa/.config.json +58 -58
  56. package/agents/vip-qa/AGENTS.md +319 -319
  57. package/agents/vip-qa/BOOTSTRAP.md +73 -73
  58. package/agents/vip-qa/HEARTBEAT.md +23 -23
  59. package/agents/vip-qa/IDENTITY.md +7 -7
  60. package/agents/vip-qa/MEMORY.md +23 -23
  61. package/agents/vip-qa/SOUL.md +34 -34
  62. package/agents/vip-qa/TOOLS.md +41 -41
  63. package/agents/vip-qa/USER.md +16 -16
  64. package/agents/vip-qa/scripts/setup_links.sh +39 -39
  65. package/bin/sophhub.js +25 -25
  66. package/package.json +35 -33
  67. package/skills/agent-install/skill.json +34 -34
  68. package/skills/agent-install/src/SKILL.md +240 -240
  69. package/skills/agent-install/src/pyproject.toml +6 -6
  70. package/skills/agent-install/src/scripts/backup_agent.py +120 -120
  71. package/skills/agent-install/src/scripts/check_installed.py +479 -479
  72. package/skills/agent-install/src/scripts/common.py +568 -568
  73. package/skills/agent-install/src/scripts/copy_agent_files.py +59 -59
  74. package/skills/agent-install/src/scripts/list_agents.py +285 -285
  75. package/skills/agent-install/src/scripts/resolve_install_params.py +90 -90
  76. package/skills/agent-install/src/scripts/update_agent_md.py +76 -76
  77. package/skills/agent-install/src/scripts/update_openclaw.py +193 -193
  78. package/skills/agent-install/src/scripts/verify_download.py +148 -148
  79. package/skills/aippt/skill.json +20 -20
  80. package/skills/aippt/src/SKILL.md +235 -235
  81. package/skills/aippt/src/pyproject.toml +8 -8
  82. package/skills/aippt/src/scripts/auth.py +122 -122
  83. package/skills/aippt/src/scripts/ppt.py +361 -361
  84. package/skills/aippt/src/scripts/provider_docmee.py +299 -299
  85. package/skills/beauty-salon-inventory/skill.json +16 -16
  86. package/skills/beauty-salon-inventory/src/SKILL.md +69 -69
  87. package/skills/beauty-salon-inventory/src/scripts/init_salon_inventory.py +39 -39
  88. package/skills/beauty-salon-inventory/src/scripts/init_salon_inventory.sh +4 -4
  89. package/skills/beauty-salon-inventory/src/scripts/salon_inventory_cli.py +244 -244
  90. package/skills/beauty-salon-marketing/skill.json +10 -10
  91. package/skills/beauty-salon-marketing/src/SKILL.md +36 -36
  92. package/skills/beauty-salon-marketing/src/playbooks/beauty-salon-festival.md +19 -19
  93. package/skills/beauty-salon-marketing/src/playbooks/beauty-salon-segment.md +18 -18
  94. package/skills/beauty-salon-marketing/src/scripts/beauty_marketing_cli.py +99 -99
  95. package/skills/beauty-salon-marketing/src/scripts/member_segment.py +114 -114
  96. package/skills/beauty-salon-member-appointment/skill.json +10 -10
  97. package/skills/beauty-salon-member-appointment/src/SKILL.md +36 -36
  98. package/skills/beauty-salon-member-appointment/src/pyproject.toml +9 -9
  99. package/skills/beauty-salon-member-appointment/src/scripts/run_e2e_smoke.py +160 -160
  100. package/skills/beauty-salon-member-appointment/src/src/member_appt_cli/__init__.py +1 -1
  101. package/skills/beauty-salon-member-appointment/src/src/member_appt_cli/__main__.py +4 -4
  102. package/skills/beauty-salon-member-appointment/src/src/member_appt_cli/cli.py +921 -921
  103. package/skills/beauty-salon-member-appointment/src/src/member_appt_cli/db.py +30 -30
  104. package/skills/beauty-salon-membership/skill.json +20 -20
  105. package/skills/beauty-salon-membership/src/SKILL.md +67 -67
  106. package/skills/beauty-salon-product-service/skill.json +12 -12
  107. package/skills/beauty-salon-product-service/src/SKILL.md +42 -42
  108. package/skills/beauty-salon-product-service/src/pyproject.toml +9 -9
  109. package/skills/beauty-salon-product-service/src/src/product_service_cli/__init__.py +1 -1
  110. package/skills/beauty-salon-product-service/src/src/product_service_cli/__main__.py +4 -4
  111. package/skills/beauty-salon-product-service/src/src/product_service_cli/cli.py +329 -329
  112. package/skills/beauty-salon-product-service/src/src/product_service_cli/db.py +29 -29
  113. package/skills/beauty-salon-staff/skill.json +10 -10
  114. package/skills/beauty-salon-staff/src/SKILL.md +37 -37
  115. package/skills/beauty-salon-staff/src/pyproject.toml +9 -9
  116. package/skills/beauty-salon-staff/src/src/staff_cli/__init__.py +1 -1
  117. package/skills/beauty-salon-staff/src/src/staff_cli/__main__.py +4 -4
  118. package/skills/beauty-salon-staff/src/src/staff_cli/cli.py +479 -479
  119. package/skills/beauty-salon-staff/src/src/staff_cli/db.py +28 -28
  120. package/skills/beauty-salon-suite/skill.json +13 -13
  121. package/skills/beauty-salon-suite/src/SKILL.md +18 -18
  122. package/skills/beauty-salon-suite/src/beauty_db/__init__.py +2 -2
  123. package/skills/beauty-salon-suite/src/beauty_db/db.py +249 -249
  124. package/skills/beauty-salon-traffic/skill.json +20 -20
  125. package/skills/beauty-salon-traffic/src/SKILL.md +84 -84
  126. package/skills/bing-image-search/skill.json +20 -20
  127. package/skills/bing-image-search/src/SKILL.md +105 -105
  128. package/skills/bot-api-status/skill.json +44 -44
  129. package/skills/bot-api-status/src/SKILL.md +99 -99
  130. package/skills/bot-api-status/src/pyproject.toml +5 -5
  131. package/skills/bot-api-status/src/scripts/secret.py +496 -496
  132. package/skills/bot-secret/skill.json +35 -35
  133. package/skills/bot-secret/src/SKILL.md +51 -51
  134. package/skills/bot-secret/src/pyproject.toml +5 -5
  135. package/skills/bot-secret/src/scripts/secret.py +120 -120
  136. package/skills/cake-flower-holiday-campaign/skill.json +20 -20
  137. package/skills/cake-flower-holiday-campaign/src/SKILL.md +68 -68
  138. package/skills/cake-flower-order-sop/skill.json +20 -20
  139. package/skills/cake-flower-order-sop/src/SKILL.md +65 -65
  140. package/skills/claw-agent-get-send/skill.json +32 -32
  141. package/skills/claw-agent-get-send/src/SKILL.md +43 -43
  142. package/skills/claw-agent-get-send/src/pyproject.toml +5 -5
  143. package/skills/claw-agent-get-send/src/scripts/appia_claw.py +379 -379
  144. package/skills/compact-context/skill.json +20 -20
  145. package/skills/compact-context/src/SKILL.md +133 -133
  146. package/skills/compact-context/src/scripts/check.sh +381 -381
  147. package/skills/compact-context/src/scripts/set-keep-recent.mjs +1337 -1337
  148. package/skills/compact-context/src/scripts/setup.sh +96 -96
  149. package/skills/consensus/skill.json +20 -20
  150. package/skills/consensus/src/SKILL.md +93 -93
  151. package/skills/deepwiki/skill.json +20 -20
  152. package/skills/deepwiki/src/SKILL.md +45 -45
  153. package/skills/deepwiki/src/_meta.json +5 -5
  154. package/skills/deepwiki/src/scripts/deepwiki.js +135 -135
  155. package/skills/didi-ride/skill.json +20 -20
  156. package/skills/didi-ride/src/SKILL.md +309 -309
  157. package/skills/didi-ride/src/_meta.json +5 -5
  158. package/skills/didi-ride/src/assets/PREFERENCE.md +58 -58
  159. package/skills/didi-ride/src/package.json +15 -15
  160. package/skills/didi-ride/src/references/api_references.md +171 -171
  161. package/skills/didi-ride/src/references/error_handling.md +68 -68
  162. package/skills/didi-ride/src/references/setup.md +73 -73
  163. package/skills/didi-ride/src/references/workflow.md +150 -150
  164. package/skills/feishu-bitable/skill.json +20 -20
  165. package/skills/feishu-bitable/src/CHECKLIST.md +149 -149
  166. package/skills/feishu-bitable/src/README.md +177 -177
  167. package/skills/feishu-bitable/src/SKILL.md +113 -113
  168. package/skills/feishu-bitable/src/_meta.json +5 -5
  169. package/skills/feishu-bitable/src/api.js +380 -380
  170. package/skills/feishu-bitable/src/bin/cli.js +283 -283
  171. package/skills/feishu-bitable/src/description.md +142 -142
  172. package/skills/feishu-bitable/src/examples/create-records.json +51 -51
  173. package/skills/feishu-bitable/src/examples/create-table.json +63 -63
  174. package/skills/feishu-bitable/src/package-lock.json +324 -324
  175. package/skills/feishu-bitable/src/package.json +32 -32
  176. package/skills/feishu-bitable/src/publish-config.json +13 -13
  177. package/skills/feishu-bitable/src/test-simple.js +60 -60
  178. package/skills/feishu-bitable/src/utils.js +260 -260
  179. package/skills/feishu-notes-assistant-universal/skill.json +20 -20
  180. package/skills/feishu-notes-assistant-universal/src/README.md +55 -55
  181. package/skills/feishu-notes-assistant-universal/src/SKILL.md +159 -159
  182. package/skills/feishu-notes-assistant-universal/src/scripts/_resolve_lark_cli.py +58 -58
  183. package/skills/feishu-notes-assistant-universal/src/scripts/openclaw_meeting_minutes.py +462 -462
  184. package/skills/feishu-notes-assistant-universal/src/scripts/openclaw_notes_crud.py +547 -547
  185. package/skills/feishu-notes-assistant-universal/src/scripts/openclaw_notes_crud_test.py +181 -181
  186. package/skills/feishu-notes-assistant-universal/src/scripts/run_meeting_minutes.py +80 -80
  187. package/skills/feishu-notes-assistant-universal/src/scripts/run_meeting_minutes.sh +5 -5
  188. package/skills/feishu-notes-assistant-universal/src/scripts/run_note_crud.py +32 -32
  189. package/skills/feishu-notes-assistant-universal/src/scripts/run_note_crud.sh +5 -5
  190. package/skills/flight-booking/skill.json +36 -36
  191. package/skills/flight-booking/src/SKILL.md +288 -288
  192. package/skills/flight-booking/src/scripts/flight_booking.py +1237 -1237
  193. package/skills/flyai/skill.json +20 -20
  194. package/skills/flyai/src/SKILL.md +119 -119
  195. package/skills/flyai/src/references/fliggy-fast-search.md +53 -53
  196. package/skills/flyai/src/references/search-flight.md +89 -89
  197. package/skills/flyai/src/references/search-hotels.md +57 -57
  198. package/skills/flyai/src/references/search-poi.md +48 -48
  199. package/skills/google-maps/skill.json +20 -20
  200. package/skills/google-maps/src/SKILL.md +237 -237
  201. package/skills/google-maps/src/_meta.json +5 -5
  202. package/skills/google-maps/src/lib/map_helper.py +912 -912
  203. package/skills/image-classify/skill.json +42 -42
  204. package/skills/image-classify/src/SKILL.md +368 -368
  205. package/skills/image-classify/src/references/config.json +4 -4
  206. package/skills/image-classify/src/scripts/face_search.py +1276 -1276
  207. package/skills/image-description/skill.json +34 -34
  208. package/skills/image-description/src/SKILL.md +33 -33
  209. package/skills/image-description/src/pyproject.toml +8 -8
  210. package/skills/image-description/src/scripts/ana_image.py +112 -112
  211. package/skills/image-identify-world/skill.json +20 -20
  212. package/skills/image-identify-world/src/SKILL.md +40 -40
  213. package/skills/image-identify-world/src/pyproject.toml +8 -8
  214. package/skills/image-identify-world/src/scripts/identify_world.py +115 -115
  215. package/skills/insurance-policy-review/skill.json +27 -27
  216. package/skills/insurance-policy-review/src/SKILL.md +75 -75
  217. package/skills/insurance-sales-playbook/skill.json +20 -20
  218. package/skills/insurance-sales-playbook/src/SKILL.md +58 -58
  219. package/skills/inventory-management/skill.json +20 -20
  220. package/skills/inventory-management/src/SKILL.md +241 -241
  221. package/skills/inventory-management/src/scripts/inventory.py +1844 -1844
  222. package/skills/large-task-router/skill.json +20 -20
  223. package/skills/large-task-router/src/SKILL.md +79 -79
  224. package/skills/large-task-router/src/templates/plan.md +74 -74
  225. package/skills/lawding-contract-review/skill.json +20 -20
  226. package/skills/lawding-contract-review/src/SKILL.md +284 -284
  227. package/skills/lawding-contract-review/src/references/legal-language-library.md +1385 -1385
  228. package/skills/lawding-contract-review/src/scripts/build_reminders.py +471 -471
  229. package/skills/lawding-contract-review/src/scripts/register_contract_cron.py +457 -457
  230. package/skills/md2pdf-converter/skill.json +20 -20
  231. package/skills/md2pdf-converter/src/SKILL.md +244 -244
  232. package/skills/md2pdf-converter/src/_meta.json +5 -5
  233. package/skills/md2pdf-converter/src/scripts/generate_emoji_mapping.py +74 -74
  234. package/skills/md2pdf-converter/src/scripts/md2pdf-local.sh +291 -291
  235. package/skills/notes-hub-assistant/skill.json +20 -20
  236. package/skills/notes-hub-assistant/src/SKILL.md +233 -233
  237. package/skills/notes-hub-assistant/src/scripts/_resolve_lark_cli.py +48 -48
  238. package/skills/notes-hub-assistant/src/scripts/openclaw_meeting_minutes.py +473 -473
  239. package/skills/notes-hub-assistant/src/scripts/openclaw_notes_crud.py +596 -596
  240. package/skills/notes-hub-assistant/src/scripts/openclaw_wolai_notes_crud.py +364 -364
  241. package/skills/notes-hub-assistant/src/scripts/run_meeting_minutes.py +79 -79
  242. package/skills/notes-hub-assistant/src/scripts/run_note_crud.py +37 -37
  243. package/skills/notes-hub-assistant/src/scripts/run_notionbot.py +36 -36
  244. package/skills/notes-hub-assistant/src/scripts/run_wolai_note_crud.py +27 -27
  245. package/skills/schedule-reminder/skill.json +20 -20
  246. package/skills/schedule-reminder/src/SKILL.md +619 -619
  247. package/skills/schedule-reminder/src/schedule_template.md +68 -68
  248. package/skills/schedule-reminder/src/scripts/append_event.py +204 -204
  249. package/skills/schedule-reminder/src/scripts/create_reminders.sh +163 -163
  250. package/skills/schedule-reminder/src/scripts/daily_activate.sh +175 -175
  251. package/skills/schedule-reminder/src/scripts/parse_schedule.py +704 -704
  252. package/skills/schedule-reminder/src/scripts/setup.sh +242 -242
  253. package/skills/schedule-reminder/src/用户指南.md +311 -311
  254. package/skills/sessions-analysis/skill.json +34 -34
  255. package/skills/sessions-analysis/src/SKILL.md +81 -81
  256. package/skills/sessions-analysis/src/pyproject.toml +5 -5
  257. package/skills/sessions-analysis/src/scripts/ana_logs.py +205 -205
  258. package/skills/share-skill/skill.json +20 -20
  259. package/skills/share-skill/src/SKILL.md +261 -261
  260. package/skills/share-skill/src/scripts/share_skill_to_friend.py +1031 -1031
  261. package/skills/skill-creator/skill.json +20 -20
  262. package/skills/skill-creator/src/SKILL.md +370 -370
  263. package/skills/skill-creator/src/license.txt +202 -202
  264. package/skills/skill-creator/src/scripts/init_skill.py +378 -378
  265. package/skills/skill-creator/src/scripts/package_skill.py +111 -111
  266. package/skills/skill-creator/src/scripts/quick_validate.py +101 -101
  267. package/skills/skillhub/skill.json +27 -27
  268. package/skills/skillhub/src/SKILL.md +121 -121
  269. package/skills/sophnet-age-appearance/skill.json +20 -20
  270. package/skills/sophnet-age-appearance/src/SKILL.md +83 -83
  271. package/skills/sophnet-age-appearance/src/pyproject.toml +10 -10
  272. package/skills/sophnet-age-appearance/src/scripts/age_appearance.py +395 -395
  273. package/skills/sophnet-age-appearance/src/scripts/age_face_crop.py +313 -313
  274. package/skills/sophnet-bot-client/skill.json +20 -20
  275. package/skills/sophnet-bot-client/src/SKILL.md +255 -255
  276. package/skills/sophnet-bot-client/src/pyproject.toml +13 -13
  277. package/skills/sophnet-bot-client/src/scripts/bot_client_proxy.py +165 -165
  278. package/skills/sophnet-bot-client/src/scripts/bot_client_safe.sh +29 -29
  279. package/skills/sophnet-bot-client/src/scripts/bot_client_setup.py +502 -502
  280. package/skills/sophnet-bot-client/src/tests/test_bot_client_proxy.py +255 -255
  281. package/skills/sophnet-bot-client/src/tests/test_bot_client_setup.py +679 -679
  282. package/skills/sophnet-bot-client/src/uv.lock +8 -8
  283. package/skills/sophnet-customer-management/skill.json +20 -20
  284. package/skills/sophnet-customer-management/src/SKILL.md +270 -270
  285. package/skills/sophnet-customer-management/src/pyproject.toml +15 -15
  286. package/skills/sophnet-customer-management/src/src/customer_mgmt_cli/__init__.py +2 -2
  287. package/skills/sophnet-customer-management/src/src/customer_mgmt_cli/__main__.py +5 -5
  288. package/skills/sophnet-customer-management/src/src/customer_mgmt_cli/cli.py +67 -67
  289. package/skills/sophnet-customer-management/src/src/customer_mgmt_cli/commands/__init__.py +2 -2
  290. package/skills/sophnet-customer-management/src/src/customer_mgmt_cli/commands/customer.py +60 -60
  291. package/skills/sophnet-customer-management/src/src/customer_mgmt_cli/commands/export_file.py +18 -18
  292. package/skills/sophnet-customer-management/src/src/customer_mgmt_cli/commands/import_file.py +15 -15
  293. package/skills/sophnet-customer-management/src/src/customer_mgmt_cli/commands/reminder.py +26 -26
  294. package/skills/sophnet-customer-management/src/src/customer_mgmt_cli/commands/schema.py +28 -28
  295. package/skills/sophnet-customer-management/src/src/customer_mgmt_cli/config.py +54 -54
  296. package/skills/sophnet-customer-management/src/src/customer_mgmt_core/__init__.py +2 -2
  297. package/skills/sophnet-customer-management/src/src/customer_mgmt_core/exporter.py +85 -85
  298. package/skills/sophnet-customer-management/src/src/customer_mgmt_core/models.py +84 -84
  299. package/skills/sophnet-customer-management/src/src/customer_mgmt_core/normalizer.py +144 -144
  300. package/skills/sophnet-customer-management/src/src/customer_mgmt_core/parser.py +241 -241
  301. package/skills/sophnet-customer-management/src/src/customer_mgmt_core/query.py +109 -109
  302. package/skills/sophnet-customer-management/src/src/customer_mgmt_core/reminder.py +121 -121
  303. package/skills/sophnet-customer-management/src/src/customer_mgmt_core/repository.py +397 -397
  304. package/skills/sophnet-customer-management/src/src/customer_mgmt_core/schema.py +106 -106
  305. package/skills/sophnet-customer-management/src/src/customer_mgmt_core/service.py +565 -565
  306. package/skills/sophnet-customer-management/src/uv.lock +48 -48
  307. package/skills/sophnet-customized-marketing/skill.json +28 -28
  308. package/skills/sophnet-customized-marketing/src/SKILL.md +144 -144
  309. package/skills/sophnet-customized-marketing/src/playbooks/campaign-planning.md +187 -187
  310. package/skills/sophnet-customized-marketing/src/playbooks/content-generation.md +124 -124
  311. package/skills/sophnet-customized-marketing/src/playbooks/marketing-calendar.md +59 -59
  312. package/skills/sophnet-customized-marketing/src/playbooks/multi-channel-bundle.md +94 -94
  313. package/skills/sophnet-customized-marketing/src/playbooks/poster-generation.md +182 -182
  314. package/skills/sophnet-customized-marketing/src/playbooks/style-profile-workflow.md +103 -103
  315. package/skills/sophnet-customized-marketing/src/pyproject.toml +8 -8
  316. package/skills/sophnet-customized-marketing/src/references/campaign-mechanics.md +168 -168
  317. package/skills/sophnet-customized-marketing/src/references/content-safety.md +26 -26
  318. package/skills/sophnet-customized-marketing/src/references/marketing-date-checklist.md +99 -99
  319. package/skills/sophnet-customized-marketing/src/references/platform-writing-guidelines.md +88 -88
  320. package/skills/sophnet-customized-marketing/src/references/quality-checklist.md +44 -44
  321. package/skills/sophnet-customized-marketing/src/scripts/generate_poster.py +572 -572
  322. package/skills/sophnet-customized-marketing/src/scripts/style_profile.py +215 -215
  323. package/skills/sophnet-dailynews/skill.json +20 -20
  324. package/skills/sophnet-dailynews/src/SKILL.md +179 -179
  325. package/skills/sophnet-dailynews/src/cache.json +150 -150
  326. package/skills/sophnet-dailynews/src/sources.json +230 -230
  327. package/skills/sophnet-docx/skill.json +20 -20
  328. package/skills/sophnet-docx/src/SKILL.md +463 -463
  329. package/skills/sophnet-docx/src/package-lock.json +208 -208
  330. package/skills/sophnet-docx/src/package.json +16 -16
  331. package/skills/sophnet-docx/src/pyproject.toml +11 -11
  332. package/skills/sophnet-docx/src/scripts/__init__.py +1 -1
  333. package/skills/sophnet-docx/src/scripts/accept_changes.py +135 -135
  334. package/skills/sophnet-docx/src/scripts/comment.py +318 -318
  335. package/skills/sophnet-docx/src/scripts/ensure_uv_env.sh +68 -68
  336. package/skills/sophnet-docx/src/scripts/office/helpers/merge_runs.py +199 -199
  337. package/skills/sophnet-docx/src/scripts/office/helpers/simplify_redlines.py +197 -197
  338. package/skills/sophnet-docx/src/scripts/office/pack.py +159 -159
  339. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +1499 -1499
  340. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +146 -146
  341. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +1085 -1085
  342. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +11 -11
  343. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +3081 -3081
  344. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +23 -23
  345. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +185 -185
  346. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +287 -287
  347. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +1676 -1676
  348. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +28 -28
  349. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +144 -144
  350. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +174 -174
  351. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +25 -25
  352. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +18 -18
  353. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +59 -59
  354. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +56 -56
  355. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +195 -195
  356. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +582 -582
  357. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +25 -25
  358. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +4439 -4439
  359. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +570 -570
  360. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +509 -509
  361. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +12 -12
  362. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +108 -108
  363. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +96 -96
  364. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +3646 -3646
  365. package/skills/sophnet-docx/src/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +116 -116
  366. package/skills/sophnet-docx/src/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +42 -42
  367. package/skills/sophnet-docx/src/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +50 -50
  368. package/skills/sophnet-docx/src/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +49 -49
  369. package/skills/sophnet-docx/src/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +33 -33
  370. package/skills/sophnet-docx/src/scripts/office/schemas/mce/mc.xsd +75 -75
  371. package/skills/sophnet-docx/src/scripts/office/schemas/microsoft/wml-2010.xsd +560 -560
  372. package/skills/sophnet-docx/src/scripts/office/schemas/microsoft/wml-2012.xsd +67 -67
  373. package/skills/sophnet-docx/src/scripts/office/schemas/microsoft/wml-2018.xsd +14 -14
  374. package/skills/sophnet-docx/src/scripts/office/schemas/microsoft/wml-cex-2018.xsd +20 -20
  375. package/skills/sophnet-docx/src/scripts/office/schemas/microsoft/wml-cid-2016.xsd +13 -13
  376. package/skills/sophnet-docx/src/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +4 -4
  377. package/skills/sophnet-docx/src/scripts/office/schemas/microsoft/wml-symex-2015.xsd +8 -8
  378. package/skills/sophnet-docx/src/scripts/office/soffice.py +183 -183
  379. package/skills/sophnet-docx/src/scripts/office/unpack.py +132 -132
  380. package/skills/sophnet-docx/src/scripts/office/validate.py +111 -111
  381. package/skills/sophnet-docx/src/scripts/office/validators/__init__.py +15 -15
  382. package/skills/sophnet-docx/src/scripts/office/validators/base.py +847 -847
  383. package/skills/sophnet-docx/src/scripts/office/validators/docx.py +446 -446
  384. package/skills/sophnet-docx/src/scripts/office/validators/pptx.py +275 -275
  385. package/skills/sophnet-docx/src/scripts/office/validators/redlining.py +247 -247
  386. package/skills/sophnet-docx/src/scripts/templates/comments.xml +3 -3
  387. package/skills/sophnet-docx/src/scripts/templates/commentsExtended.xml +3 -3
  388. package/skills/sophnet-docx/src/scripts/templates/commentsExtensible.xml +3 -3
  389. package/skills/sophnet-docx/src/scripts/templates/commentsIds.xml +3 -3
  390. package/skills/sophnet-docx/src/scripts/templates/people.xml +3 -3
  391. package/skills/sophnet-docx/src/scripts/upload_file.sh +96 -96
  392. package/skills/sophnet-docx/src/uv.lock +320 -320
  393. package/skills/sophnet-face-search/skill.json +20 -20
  394. package/skills/sophnet-face-search/src/SKILL.md +115 -115
  395. package/skills/sophnet-face-search/src/pyproject.toml +11 -11
  396. package/skills/sophnet-face-search/src/scripts/face_search.py +335 -335
  397. package/skills/sophnet-face-search/src/uv.lock +508 -508
  398. package/skills/sophnet-id-photo/skill.json +20 -20
  399. package/skills/sophnet-id-photo/src/SKILL.md +107 -107
  400. package/skills/sophnet-id-photo/src/pyproject.toml +10 -10
  401. package/skills/sophnet-id-photo/src/scripts/id_photo.py +540 -540
  402. package/skills/sophnet-id-photo/src/scripts/id_photo_compliance.py +215 -215
  403. package/skills/sophnet-id-photo/src/scripts/id_photo_face_crop.py +313 -313
  404. package/skills/sophnet-image-edit/skill.json +20 -20
  405. package/skills/sophnet-image-edit/src/SKILL.md +140 -140
  406. package/skills/sophnet-image-edit/src/pyproject.toml +9 -9
  407. package/skills/sophnet-image-edit/src/scripts/edit_and_preview.sh +68 -68
  408. package/skills/sophnet-image-edit/src/scripts/edit_image.py +279 -279
  409. package/skills/sophnet-image-edit/src/uv.lock +234 -234
  410. package/skills/sophnet-image-generate/skill.json +20 -20
  411. package/skills/sophnet-image-generate/src/SKILL.md +62 -62
  412. package/skills/sophnet-image-generate/src/pyproject.toml +9 -9
  413. package/skills/sophnet-image-generate/src/scripts/generate_image.py +156 -156
  414. package/skills/sophnet-image-generate/src/uv.lock +234 -234
  415. package/skills/sophnet-image-ocr/skill.json +20 -20
  416. package/skills/sophnet-image-ocr/src/SKILL.md +167 -167
  417. package/skills/sophnet-image-ocr/src/pyproject.toml +13 -13
  418. package/skills/sophnet-image-ocr/src/scripts/ocr.py +225 -225
  419. package/skills/sophnet-image-ocr/src/uv.lock +234 -234
  420. package/skills/sophnet-infinite-talk/skill.json +20 -20
  421. package/skills/sophnet-infinite-talk/src/SKILL.md +140 -140
  422. package/skills/sophnet-infinite-talk/src/pyproject.toml +9 -9
  423. package/skills/sophnet-infinite-talk/src/scripts/gen.py +172 -172
  424. package/skills/sophnet-oss/skill.json +27 -27
  425. package/skills/sophnet-oss/src/SKILL.md +118 -118
  426. package/skills/sophnet-oss/src/pyproject.toml +8 -8
  427. package/skills/sophnet-oss/src/scripts/upload_file.py +43 -43
  428. package/skills/sophnet-pdf/skill.json +20 -20
  429. package/skills/sophnet-pdf/src/SKILL.md +413 -413
  430. package/skills/sophnet-pdf/src/forms.md +297 -297
  431. package/skills/sophnet-pdf/src/pyproject.toml +14 -14
  432. package/skills/sophnet-pdf/src/reference.md +611 -611
  433. package/skills/sophnet-pdf/src/scripts/check_bounding_boxes.py +65 -65
  434. package/skills/sophnet-pdf/src/scripts/check_fillable_fields.py +11 -11
  435. package/skills/sophnet-pdf/src/scripts/convert_pdf_to_images.py +33 -33
  436. package/skills/sophnet-pdf/src/scripts/create_validation_image.py +37 -37
  437. package/skills/sophnet-pdf/src/scripts/enhance_tutorial.py +557 -557
  438. package/skills/sophnet-pdf/src/scripts/ensure_uv_env.sh +68 -68
  439. package/skills/sophnet-pdf/src/scripts/extract_form_field_info.py +122 -122
  440. package/skills/sophnet-pdf/src/scripts/extract_form_structure.py +115 -115
  441. package/skills/sophnet-pdf/src/scripts/extract_pdf_content.py +34 -34
  442. package/skills/sophnet-pdf/src/scripts/fill_fillable_fields.py +98 -98
  443. package/skills/sophnet-pdf/src/scripts/fill_pdf_form_with_annotations.py +107 -107
  444. package/skills/sophnet-pdf/src/scripts/upload_file.sh +88 -88
  445. package/skills/sophnet-pdf/src/uv.lock +537 -537
  446. package/skills/sophnet-qa-install/skill.json +27 -27
  447. package/skills/sophnet-qa-install/src/SKILL.md +210 -210
  448. package/skills/sophnet-qa-install/src/pyproject.toml +6 -6
  449. package/skills/sophnet-qa-install/src/scripts/backup_md.py +35 -35
  450. package/skills/sophnet-qa-install/src/scripts/check_installed.py +143 -143
  451. package/skills/sophnet-qa-install/src/scripts/update_config.py +142 -142
  452. package/skills/sophnet-qa-install/src/scripts/update_md.py +73 -73
  453. package/skills/sophnet-schedule/skill.json +20 -20
  454. package/skills/sophnet-schedule/src/ARCHITECTURE.md +321 -321
  455. package/skills/sophnet-schedule/src/IMPROVEMENTS.md +145 -145
  456. package/skills/sophnet-schedule/src/SKILL.md +1050 -1050
  457. package/skills/sophnet-schedule/src/_meta.json +6 -6
  458. package/skills/sophnet-schedule/src/api/models.py +245 -245
  459. package/skills/sophnet-schedule/src/apps/add_event.py +237 -237
  460. package/skills/sophnet-schedule/src/apps/check_reminders.py +112 -112
  461. package/skills/sophnet-schedule/src/apps/check_roc.py +246 -246
  462. package/skills/sophnet-schedule/src/apps/generate_daily_plan.py +342 -342
  463. package/skills/sophnet-schedule/src/apps/import_events.py +216 -216
  464. package/skills/sophnet-schedule/src/apps/monitor_calendar_changes.py +140 -140
  465. package/skills/sophnet-schedule/src/apps/register_tasks.py +169 -169
  466. package/skills/sophnet-schedule/src/apps/sync_roc_to_gcal.py +174 -174
  467. package/skills/sophnet-schedule/src/compat.py +66 -66
  468. package/skills/sophnet-schedule/src/config/reminder_rules.yaml +96 -96
  469. package/skills/sophnet-schedule/src/config/roc_events.yaml +44 -44
  470. package/skills/sophnet-schedule/src/config/settings.py +133 -133
  471. package/skills/sophnet-schedule/src/config/task_registry.yaml +92 -92
  472. package/skills/sophnet-schedule/src/docs/FRONTEND_INTEGRATION_GUIDE.md +437 -437
  473. package/skills/sophnet-schedule/src/gcal/client.py +374 -374
  474. package/skills/sophnet-schedule/src/gcal/models.py +91 -91
  475. package/skills/sophnet-schedule/src/requirements.txt +6 -6
  476. package/skills/sophnet-schedule/src/scripts/setup_gcal_token.py +85 -85
  477. package/skills/sophnet-schedule/src/server.py +669 -669
  478. package/skills/sophnet-schedule/src/services/calendar_backend.py +139 -139
  479. package/skills/sophnet-schedule/src/services/conflict_detector.py +96 -96
  480. package/skills/sophnet-schedule/src/services/datetime_utils.py +117 -117
  481. package/skills/sophnet-schedule/src/services/event_classifier.py +100 -100
  482. package/skills/sophnet-schedule/src/services/event_diff.py +160 -160
  483. package/skills/sophnet-schedule/src/services/google_integration.py +500 -500
  484. package/skills/sophnet-schedule/src/services/job_store.py +100 -100
  485. package/skills/sophnet-schedule/src/services/local_event_store.py +266 -266
  486. package/skills/sophnet-schedule/src/services/reminder_planner.py +116 -116
  487. package/skills/sophnet-schedule/src/services/runtime_utils.py +31 -31
  488. package/skills/sophnet-schedule/src/services/table_parser.py +286 -286
  489. package/skills/sophnet-schedule/src/services/task_builder.py +167 -167
  490. package/skills/sophnet-schedule/src/services/time_window.py +72 -72
  491. package/skills/sophnet-sticker-edit/skill.json +27 -27
  492. package/skills/sophnet-sticker-edit/src/SKILL.md +80 -80
  493. package/skills/sophnet-sticker-edit/src/pyproject.toml +9 -9
  494. package/skills/sophnet-sticker-edit/src/scripts/edit_sticker_image.py +403 -403
  495. package/skills/sophnet-stock/skill.json +20 -20
  496. package/skills/sophnet-stock/src/App-Plan.md +442 -442
  497. package/skills/sophnet-stock/src/README.md +214 -214
  498. package/skills/sophnet-stock/src/SKILL.md +236 -236
  499. package/skills/sophnet-stock/src/TODO.md +394 -394
  500. package/skills/sophnet-stock/src/_meta.json +5 -5
  501. package/skills/sophnet-stock/src/docs/ARCHITECTURE.md +408 -408
  502. package/skills/sophnet-stock/src/docs/CONCEPT.md +233 -233
  503. package/skills/sophnet-stock/src/docs/HOT_SCANNER.md +288 -288
  504. package/skills/sophnet-stock/src/docs/README.md +95 -95
  505. package/skills/sophnet-stock/src/docs/USAGE.md +465 -465
  506. package/skills/sophnet-stock/src/scripts/analyze_stock.py +2565 -2565
  507. package/skills/sophnet-stock/src/scripts/dividends.py +365 -365
  508. package/skills/sophnet-stock/src/scripts/hot_scanner.py +582 -582
  509. package/skills/sophnet-stock/src/scripts/portfolio.py +548 -548
  510. package/skills/sophnet-stock/src/scripts/rumor_scanner.py +342 -342
  511. package/skills/sophnet-stock/src/scripts/test_stock_analysis.py +409 -409
  512. package/skills/sophnet-stock/src/scripts/watchlist.py +336 -336
  513. package/skills/sophnet-training-install/skill.json +27 -27
  514. package/skills/sophnet-training-install/src/SKILL.md +211 -211
  515. package/skills/sophnet-training-install/src/pyproject.toml +6 -6
  516. package/skills/sophnet-training-install/src/scripts/backup_md.py +35 -35
  517. package/skills/sophnet-training-install/src/scripts/check_installed.py +144 -144
  518. package/skills/sophnet-training-install/src/scripts/update_config.py +142 -142
  519. package/skills/sophnet-training-install/src/scripts/update_md.py +73 -73
  520. package/skills/sophnet-tts/skill.json +20 -20
  521. package/skills/sophnet-tts/src/SKILL.md +79 -79
  522. package/skills/sophnet-tts/src/pyproject.toml +9 -9
  523. package/skills/sophnet-tts/src/scripts/gen_tts.py +130 -130
  524. package/skills/sophnet-video-generate/skill.json +37 -37
  525. package/skills/sophnet-video-generate/src/SKILL.md +117 -117
  526. package/skills/sophnet-video-generate/src/scripts/gen_video.py +321 -321
  527. package/skills/sophnet-xlsx/skill.json +20 -20
  528. package/skills/sophnet-xlsx/src/SKILL.md +399 -399
  529. package/skills/sophnet-xlsx/src/pyproject.toml +11 -11
  530. package/skills/sophnet-xlsx/src/scripts/ensure_uv_env.sh +68 -68
  531. package/skills/sophnet-xlsx/src/scripts/office/helpers/merge_runs.py +199 -199
  532. package/skills/sophnet-xlsx/src/scripts/office/helpers/simplify_redlines.py +197 -197
  533. package/skills/sophnet-xlsx/src/scripts/office/pack.py +159 -159
  534. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +1499 -1499
  535. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +146 -146
  536. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +1085 -1085
  537. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +11 -11
  538. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +3081 -3081
  539. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +23 -23
  540. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +185 -185
  541. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +287 -287
  542. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +1676 -1676
  543. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +28 -28
  544. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +144 -144
  545. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +174 -174
  546. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +25 -25
  547. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +18 -18
  548. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +59 -59
  549. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +56 -56
  550. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +195 -195
  551. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +582 -582
  552. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +25 -25
  553. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +4439 -4439
  554. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +570 -570
  555. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +509 -509
  556. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +12 -12
  557. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +108 -108
  558. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +96 -96
  559. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +3646 -3646
  560. package/skills/sophnet-xlsx/src/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +116 -116
  561. package/skills/sophnet-xlsx/src/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +42 -42
  562. package/skills/sophnet-xlsx/src/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +50 -50
  563. package/skills/sophnet-xlsx/src/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +49 -49
  564. package/skills/sophnet-xlsx/src/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +33 -33
  565. package/skills/sophnet-xlsx/src/scripts/office/schemas/mce/mc.xsd +75 -75
  566. package/skills/sophnet-xlsx/src/scripts/office/schemas/microsoft/wml-2010.xsd +560 -560
  567. package/skills/sophnet-xlsx/src/scripts/office/schemas/microsoft/wml-2012.xsd +67 -67
  568. package/skills/sophnet-xlsx/src/scripts/office/schemas/microsoft/wml-2018.xsd +14 -14
  569. package/skills/sophnet-xlsx/src/scripts/office/schemas/microsoft/wml-cex-2018.xsd +20 -20
  570. package/skills/sophnet-xlsx/src/scripts/office/schemas/microsoft/wml-cid-2016.xsd +13 -13
  571. package/skills/sophnet-xlsx/src/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +4 -4
  572. package/skills/sophnet-xlsx/src/scripts/office/schemas/microsoft/wml-symex-2015.xsd +8 -8
  573. package/skills/sophnet-xlsx/src/scripts/office/soffice.py +183 -183
  574. package/skills/sophnet-xlsx/src/scripts/office/unpack.py +132 -132
  575. package/skills/sophnet-xlsx/src/scripts/office/validate.py +111 -111
  576. package/skills/sophnet-xlsx/src/scripts/office/validators/__init__.py +15 -15
  577. package/skills/sophnet-xlsx/src/scripts/office/validators/base.py +847 -847
  578. package/skills/sophnet-xlsx/src/scripts/office/validators/docx.py +446 -446
  579. package/skills/sophnet-xlsx/src/scripts/office/validators/pptx.py +275 -275
  580. package/skills/sophnet-xlsx/src/scripts/office/validators/redlining.py +247 -247
  581. package/skills/sophnet-xlsx/src/scripts/recalc.py +184 -184
  582. package/skills/sophnet-xlsx/src/scripts/upload_file.sh +96 -96
  583. package/skills/sophnet-xlsx/src/uv.lock +319 -319
  584. package/skills/ui-ux-pro-max/skill.json +20 -20
  585. package/skills/ui-ux-pro-max/src/SKILL.md +377 -377
  586. package/skills/ui-ux-pro-max/src/data/icons.csv +101 -101
  587. package/skills/ui-ux-pro-max/src/data/react-performance.csv +45 -45
  588. package/skills/ui-ux-pro-max/src/data/stacks/astro.csv +54 -54
  589. package/skills/ui-ux-pro-max/src/data/stacks/jetpack-compose.csv +53 -53
  590. package/skills/ui-ux-pro-max/src/data/stacks/nuxt-ui.csv +51 -51
  591. package/skills/ui-ux-pro-max/src/data/stacks/nuxtjs.csv +59 -59
  592. package/skills/ui-ux-pro-max/src/data/stacks/shadcn.csv +61 -61
  593. package/skills/ui-ux-pro-max/src/data/typography.csv +57 -57
  594. package/skills/ui-ux-pro-max/src/data/ui-reasoning.csv +101 -101
  595. package/skills/ui-ux-pro-max/src/data/web-interface.csv +31 -31
  596. package/skills/ui-ux-pro-max/src/scripts/core.py +253 -253
  597. package/skills/ui-ux-pro-max/src/scripts/design_system.py +1067 -1067
  598. package/skills/video-understand/skill.json +20 -20
  599. package/skills/video-understand/src/SKILL.md +79 -79
  600. package/skills/video-understand/src/scripts/video_understand.py +204 -204
  601. package/skills/weather/skill.json +19 -19
  602. package/skills/weather/src/SKILL.md +112 -112
  603. package/skills/web-scraper/skill.json +20 -20
  604. package/skills/web-scraper/src/SKILL.md +101 -101
  605. package/skills/web-scraper/src/scripts/scrape.py +270 -270
  606. package/skills/website-builder/skill.json +20 -20
  607. package/skills/website-builder/src/SKILL.md +266 -266
  608. package/skills/website-builder/src/scripts/deploy_site.sh +46 -46
  609. package/skills/wechat-article-publisher/skill.json +20 -20
  610. package/skills/wechat-article-publisher/src/SKILL.md +60 -60
  611. package/skills/wechat-article-publisher/src/config.json +6 -6
  612. package/skills/wechat-article-publisher/src/pyproject.toml +12 -12
  613. package/skills/wechat-article-publisher/src/scripts/publish_wechat.py +825 -825
  614. package/skills/xiaohongshu/skill.json +20 -20
  615. package/skills/xiaohongshu/src/SKILL.md +91 -91
  616. package/skills/xiaohongshu/src/_meta.json +5 -5
  617. package/skills/xiaohongshu/src/assets/card.html +216 -216
  618. package/skills/xiaohongshu/src/assets/cover.html +82 -82
  619. package/skills/xiaohongshu/src/assets/example.md +84 -84
  620. package/skills/xiaohongshu/src/assets/styles.css +318 -318
  621. package/skills/xiaohongshu/src/scripts/render_xhs_v2.py +737 -737
  622. package/skills/xiaohongshu/src/scripts/sign_server.py +158 -158
  623. package/skills/xiaohongshu/src/scripts/stealth.min.js +6 -6
  624. package/skills/xiaohongshu/src/scripts/xhs_tool.py +186 -186
  625. package/skills/xiaohongshu/src/workflow.py +185 -185
  626. package/src/commands/agent.js +112 -112
  627. package/src/commands/download.js +101 -101
  628. package/src/commands/info.js +58 -58
  629. package/src/commands/list.js +71 -71
  630. package/src/utils/agents.js +36 -36
  631. package/src/utils/config.js +22 -22
  632. package/src/utils/paths.js +31 -31
  633. package/src/utils/versions.js +57 -57
@@ -1,847 +1,847 @@
1
- """
2
- Base validator with common validation logic for document files.
3
- """
4
-
5
- import re
6
- from pathlib import Path
7
-
8
- import defusedxml.minidom
9
- import lxml.etree
10
-
11
-
12
- class BaseSchemaValidator:
13
-
14
- IGNORED_VALIDATION_ERRORS = [
15
- "hyphenationZone",
16
- "purl.org/dc/terms",
17
- ]
18
-
19
- UNIQUE_ID_REQUIREMENTS = {
20
- "comment": ("id", "file"),
21
- "commentrangestart": ("id", "file"),
22
- "commentrangeend": ("id", "file"),
23
- "bookmarkstart": ("id", "file"),
24
- "bookmarkend": ("id", "file"),
25
- "sldid": ("id", "file"),
26
- "sldmasterid": ("id", "global"),
27
- "sldlayoutid": ("id", "global"),
28
- "cm": ("authorid", "file"),
29
- "sheet": ("sheetid", "file"),
30
- "definedname": ("id", "file"),
31
- "cxnsp": ("id", "file"),
32
- "sp": ("id", "file"),
33
- "pic": ("id", "file"),
34
- "grpsp": ("id", "file"),
35
- }
36
-
37
- EXCLUDED_ID_CONTAINERS = {
38
- "sectionlst",
39
- }
40
-
41
- ELEMENT_RELATIONSHIP_TYPES = {}
42
-
43
- SCHEMA_MAPPINGS = {
44
- "word": "ISO-IEC29500-4_2016/wml.xsd",
45
- "ppt": "ISO-IEC29500-4_2016/pml.xsd",
46
- "xl": "ISO-IEC29500-4_2016/sml.xsd",
47
- "[Content_Types].xml": "ecma/fouth-edition/opc-contentTypes.xsd",
48
- "app.xml": "ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd",
49
- "core.xml": "ecma/fouth-edition/opc-coreProperties.xsd",
50
- "custom.xml": "ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd",
51
- ".rels": "ecma/fouth-edition/opc-relationships.xsd",
52
- "people.xml": "microsoft/wml-2012.xsd",
53
- "commentsIds.xml": "microsoft/wml-cid-2016.xsd",
54
- "commentsExtensible.xml": "microsoft/wml-cex-2018.xsd",
55
- "commentsExtended.xml": "microsoft/wml-2012.xsd",
56
- "chart": "ISO-IEC29500-4_2016/dml-chart.xsd",
57
- "theme": "ISO-IEC29500-4_2016/dml-main.xsd",
58
- "drawing": "ISO-IEC29500-4_2016/dml-main.xsd",
59
- }
60
-
61
- MC_NAMESPACE = "http://schemas.openxmlformats.org/markup-compatibility/2006"
62
- XML_NAMESPACE = "http://www.w3.org/XML/1998/namespace"
63
-
64
- PACKAGE_RELATIONSHIPS_NAMESPACE = (
65
- "http://schemas.openxmlformats.org/package/2006/relationships"
66
- )
67
- OFFICE_RELATIONSHIPS_NAMESPACE = (
68
- "http://schemas.openxmlformats.org/officeDocument/2006/relationships"
69
- )
70
- CONTENT_TYPES_NAMESPACE = (
71
- "http://schemas.openxmlformats.org/package/2006/content-types"
72
- )
73
-
74
- MAIN_CONTENT_FOLDERS = {"word", "ppt", "xl"}
75
-
76
- OOXML_NAMESPACES = {
77
- "http://schemas.openxmlformats.org/officeDocument/2006/math",
78
- "http://schemas.openxmlformats.org/officeDocument/2006/relationships",
79
- "http://schemas.openxmlformats.org/schemaLibrary/2006/main",
80
- "http://schemas.openxmlformats.org/drawingml/2006/main",
81
- "http://schemas.openxmlformats.org/drawingml/2006/chart",
82
- "http://schemas.openxmlformats.org/drawingml/2006/chartDrawing",
83
- "http://schemas.openxmlformats.org/drawingml/2006/diagram",
84
- "http://schemas.openxmlformats.org/drawingml/2006/picture",
85
- "http://schemas.openxmlformats.org/drawingml/2006/spreadsheetDrawing",
86
- "http://schemas.openxmlformats.org/drawingml/2006/wordprocessingDrawing",
87
- "http://schemas.openxmlformats.org/wordprocessingml/2006/main",
88
- "http://schemas.openxmlformats.org/presentationml/2006/main",
89
- "http://schemas.openxmlformats.org/spreadsheetml/2006/main",
90
- "http://schemas.openxmlformats.org/officeDocument/2006/sharedTypes",
91
- "http://www.w3.org/XML/1998/namespace",
92
- }
93
-
94
- def __init__(self, unpacked_dir, original_file=None, verbose=False):
95
- self.unpacked_dir = Path(unpacked_dir).resolve()
96
- self.original_file = Path(original_file) if original_file else None
97
- self.verbose = verbose
98
-
99
- self.schemas_dir = Path(__file__).parent.parent / "schemas"
100
-
101
- patterns = ["*.xml", "*.rels"]
102
- self.xml_files = [
103
- f for pattern in patterns for f in self.unpacked_dir.rglob(pattern)
104
- ]
105
-
106
- if not self.xml_files:
107
- print(f"Warning: No XML files found in {self.unpacked_dir}")
108
-
109
- def validate(self):
110
- raise NotImplementedError("Subclasses must implement the validate method")
111
-
112
- def repair(self) -> int:
113
- return self.repair_whitespace_preservation()
114
-
115
- def repair_whitespace_preservation(self) -> int:
116
- repairs = 0
117
-
118
- for xml_file in self.xml_files:
119
- try:
120
- content = xml_file.read_text(encoding="utf-8")
121
- dom = defusedxml.minidom.parseString(content)
122
- modified = False
123
-
124
- for elem in dom.getElementsByTagName("*"):
125
- if elem.tagName.endswith(":t") and elem.firstChild:
126
- text = elem.firstChild.nodeValue
127
- if text and (text.startswith((' ', '\t')) or text.endswith((' ', '\t'))):
128
- if elem.getAttribute("xml:space") != "preserve":
129
- elem.setAttribute("xml:space", "preserve")
130
- text_preview = repr(text[:30]) + "..." if len(text) > 30 else repr(text)
131
- print(f" Repaired: {xml_file.name}: Added xml:space='preserve' to {elem.tagName}: {text_preview}")
132
- repairs += 1
133
- modified = True
134
-
135
- if modified:
136
- xml_file.write_bytes(dom.toxml(encoding="UTF-8"))
137
-
138
- except Exception:
139
- pass
140
-
141
- return repairs
142
-
143
- def validate_xml(self):
144
- errors = []
145
-
146
- for xml_file in self.xml_files:
147
- try:
148
- lxml.etree.parse(str(xml_file))
149
- except lxml.etree.XMLSyntaxError as e:
150
- errors.append(
151
- f" {xml_file.relative_to(self.unpacked_dir)}: "
152
- f"Line {e.lineno}: {e.msg}"
153
- )
154
- except Exception as e:
155
- errors.append(
156
- f" {xml_file.relative_to(self.unpacked_dir)}: "
157
- f"Unexpected error: {str(e)}"
158
- )
159
-
160
- if errors:
161
- print(f"FAILED - Found {len(errors)} XML violations:")
162
- for error in errors:
163
- print(error)
164
- return False
165
- else:
166
- if self.verbose:
167
- print("PASSED - All XML files are well-formed")
168
- return True
169
-
170
- def validate_namespaces(self):
171
- errors = []
172
-
173
- for xml_file in self.xml_files:
174
- try:
175
- root = lxml.etree.parse(str(xml_file)).getroot()
176
- declared = set(root.nsmap.keys()) - {None}
177
-
178
- for attr_val in [
179
- v for k, v in root.attrib.items() if k.endswith("Ignorable")
180
- ]:
181
- undeclared = set(attr_val.split()) - declared
182
- errors.extend(
183
- f" {xml_file.relative_to(self.unpacked_dir)}: "
184
- f"Namespace '{ns}' in Ignorable but not declared"
185
- for ns in undeclared
186
- )
187
- except lxml.etree.XMLSyntaxError:
188
- continue
189
-
190
- if errors:
191
- print(f"FAILED - {len(errors)} namespace issues:")
192
- for error in errors:
193
- print(error)
194
- return False
195
- if self.verbose:
196
- print("PASSED - All namespace prefixes properly declared")
197
- return True
198
-
199
- def validate_unique_ids(self):
200
- errors = []
201
- global_ids = {}
202
-
203
- for xml_file in self.xml_files:
204
- try:
205
- root = lxml.etree.parse(str(xml_file)).getroot()
206
- file_ids = {}
207
-
208
- mc_elements = root.xpath(
209
- ".//mc:AlternateContent", namespaces={"mc": self.MC_NAMESPACE}
210
- )
211
- for elem in mc_elements:
212
- elem.getparent().remove(elem)
213
-
214
- for elem in root.iter():
215
- tag = (
216
- elem.tag.split("}")[-1].lower()
217
- if "}" in elem.tag
218
- else elem.tag.lower()
219
- )
220
-
221
- if tag in self.UNIQUE_ID_REQUIREMENTS:
222
- in_excluded_container = any(
223
- ancestor.tag.split("}")[-1].lower() in self.EXCLUDED_ID_CONTAINERS
224
- for ancestor in elem.iterancestors()
225
- )
226
- if in_excluded_container:
227
- continue
228
-
229
- attr_name, scope = self.UNIQUE_ID_REQUIREMENTS[tag]
230
-
231
- id_value = None
232
- for attr, value in elem.attrib.items():
233
- attr_local = (
234
- attr.split("}")[-1].lower()
235
- if "}" in attr
236
- else attr.lower()
237
- )
238
- if attr_local == attr_name:
239
- id_value = value
240
- break
241
-
242
- if id_value is not None:
243
- if scope == "global":
244
- if id_value in global_ids:
245
- prev_file, prev_line, prev_tag = global_ids[
246
- id_value
247
- ]
248
- errors.append(
249
- f" {xml_file.relative_to(self.unpacked_dir)}: "
250
- f"Line {elem.sourceline}: Global ID '{id_value}' in <{tag}> "
251
- f"already used in {prev_file} at line {prev_line} in <{prev_tag}>"
252
- )
253
- else:
254
- global_ids[id_value] = (
255
- xml_file.relative_to(self.unpacked_dir),
256
- elem.sourceline,
257
- tag,
258
- )
259
- elif scope == "file":
260
- key = (tag, attr_name)
261
- if key not in file_ids:
262
- file_ids[key] = {}
263
-
264
- if id_value in file_ids[key]:
265
- prev_line = file_ids[key][id_value]
266
- errors.append(
267
- f" {xml_file.relative_to(self.unpacked_dir)}: "
268
- f"Line {elem.sourceline}: Duplicate {attr_name}='{id_value}' in <{tag}> "
269
- f"(first occurrence at line {prev_line})"
270
- )
271
- else:
272
- file_ids[key][id_value] = elem.sourceline
273
-
274
- except (lxml.etree.XMLSyntaxError, Exception) as e:
275
- errors.append(
276
- f" {xml_file.relative_to(self.unpacked_dir)}: Error: {e}"
277
- )
278
-
279
- if errors:
280
- print(f"FAILED - Found {len(errors)} ID uniqueness violations:")
281
- for error in errors:
282
- print(error)
283
- return False
284
- else:
285
- if self.verbose:
286
- print("PASSED - All required IDs are unique")
287
- return True
288
-
289
- def validate_file_references(self):
290
- errors = []
291
-
292
- rels_files = list(self.unpacked_dir.rglob("*.rels"))
293
-
294
- if not rels_files:
295
- if self.verbose:
296
- print("PASSED - No .rels files found")
297
- return True
298
-
299
- all_files = []
300
- for file_path in self.unpacked_dir.rglob("*"):
301
- if (
302
- file_path.is_file()
303
- and file_path.name != "[Content_Types].xml"
304
- and not file_path.name.endswith(".rels")
305
- ):
306
- all_files.append(file_path.resolve())
307
-
308
- all_referenced_files = set()
309
-
310
- if self.verbose:
311
- print(
312
- f"Found {len(rels_files)} .rels files and {len(all_files)} target files"
313
- )
314
-
315
- for rels_file in rels_files:
316
- try:
317
- rels_root = lxml.etree.parse(str(rels_file)).getroot()
318
-
319
- rels_dir = rels_file.parent
320
-
321
- referenced_files = set()
322
- broken_refs = []
323
-
324
- for rel in rels_root.findall(
325
- ".//ns:Relationship",
326
- namespaces={"ns": self.PACKAGE_RELATIONSHIPS_NAMESPACE},
327
- ):
328
- target = rel.get("Target")
329
- if target and not target.startswith(
330
- ("http", "mailto:")
331
- ):
332
- if target.startswith("/"):
333
- target_path = self.unpacked_dir / target.lstrip("/")
334
- elif rels_file.name == ".rels":
335
- target_path = self.unpacked_dir / target
336
- else:
337
- base_dir = rels_dir.parent
338
- target_path = base_dir / target
339
-
340
- try:
341
- target_path = target_path.resolve()
342
- if target_path.exists() and target_path.is_file():
343
- referenced_files.add(target_path)
344
- all_referenced_files.add(target_path)
345
- else:
346
- broken_refs.append((target, rel.sourceline))
347
- except (OSError, ValueError):
348
- broken_refs.append((target, rel.sourceline))
349
-
350
- if broken_refs:
351
- rel_path = rels_file.relative_to(self.unpacked_dir)
352
- for broken_ref, line_num in broken_refs:
353
- errors.append(
354
- f" {rel_path}: Line {line_num}: Broken reference to {broken_ref}"
355
- )
356
-
357
- except Exception as e:
358
- rel_path = rels_file.relative_to(self.unpacked_dir)
359
- errors.append(f" Error parsing {rel_path}: {e}")
360
-
361
- unreferenced_files = set(all_files) - all_referenced_files
362
-
363
- if unreferenced_files:
364
- for unref_file in sorted(unreferenced_files):
365
- unref_rel_path = unref_file.relative_to(self.unpacked_dir)
366
- errors.append(f" Unreferenced file: {unref_rel_path}")
367
-
368
- if errors:
369
- print(f"FAILED - Found {len(errors)} relationship validation errors:")
370
- for error in errors:
371
- print(error)
372
- print(
373
- "CRITICAL: These errors will cause the document to appear corrupt. "
374
- + "Broken references MUST be fixed, "
375
- + "and unreferenced files MUST be referenced or removed."
376
- )
377
- return False
378
- else:
379
- if self.verbose:
380
- print(
381
- "PASSED - All references are valid and all files are properly referenced"
382
- )
383
- return True
384
-
385
- def validate_all_relationship_ids(self):
386
- import lxml.etree
387
-
388
- errors = []
389
-
390
- for xml_file in self.xml_files:
391
- if xml_file.suffix == ".rels":
392
- continue
393
-
394
- rels_dir = xml_file.parent / "_rels"
395
- rels_file = rels_dir / f"{xml_file.name}.rels"
396
-
397
- if not rels_file.exists():
398
- continue
399
-
400
- try:
401
- rels_root = lxml.etree.parse(str(rels_file)).getroot()
402
- rid_to_type = {}
403
-
404
- for rel in rels_root.findall(
405
- f".//{{{self.PACKAGE_RELATIONSHIPS_NAMESPACE}}}Relationship"
406
- ):
407
- rid = rel.get("Id")
408
- rel_type = rel.get("Type", "")
409
- if rid:
410
- if rid in rid_to_type:
411
- rels_rel_path = rels_file.relative_to(self.unpacked_dir)
412
- errors.append(
413
- f" {rels_rel_path}: Line {rel.sourceline}: "
414
- f"Duplicate relationship ID '{rid}' (IDs must be unique)"
415
- )
416
- type_name = (
417
- rel_type.split("/")[-1] if "/" in rel_type else rel_type
418
- )
419
- rid_to_type[rid] = type_name
420
-
421
- xml_root = lxml.etree.parse(str(xml_file)).getroot()
422
-
423
- r_ns = self.OFFICE_RELATIONSHIPS_NAMESPACE
424
- rid_attrs_to_check = ["id", "embed", "link"]
425
- for elem in xml_root.iter():
426
- for attr_name in rid_attrs_to_check:
427
- rid_attr = elem.get(f"{{{r_ns}}}{attr_name}")
428
- if not rid_attr:
429
- continue
430
- xml_rel_path = xml_file.relative_to(self.unpacked_dir)
431
- elem_name = (
432
- elem.tag.split("}")[-1] if "}" in elem.tag else elem.tag
433
- )
434
-
435
- if rid_attr not in rid_to_type:
436
- errors.append(
437
- f" {xml_rel_path}: Line {elem.sourceline}: "
438
- f"<{elem_name}> r:{attr_name} references non-existent relationship '{rid_attr}' "
439
- f"(valid IDs: {', '.join(sorted(rid_to_type.keys())[:5])}{'...' if len(rid_to_type) > 5 else ''})"
440
- )
441
- elif attr_name == "id" and self.ELEMENT_RELATIONSHIP_TYPES:
442
- expected_type = self._get_expected_relationship_type(
443
- elem_name
444
- )
445
- if expected_type:
446
- actual_type = rid_to_type[rid_attr]
447
- if expected_type not in actual_type.lower():
448
- errors.append(
449
- f" {xml_rel_path}: Line {elem.sourceline}: "
450
- f"<{elem_name}> references '{rid_attr}' which points to '{actual_type}' "
451
- f"but should point to a '{expected_type}' relationship"
452
- )
453
-
454
- except Exception as e:
455
- xml_rel_path = xml_file.relative_to(self.unpacked_dir)
456
- errors.append(f" Error processing {xml_rel_path}: {e}")
457
-
458
- if errors:
459
- print(f"FAILED - Found {len(errors)} relationship ID reference errors:")
460
- for error in errors:
461
- print(error)
462
- print("\nThese ID mismatches will cause the document to appear corrupt!")
463
- return False
464
- else:
465
- if self.verbose:
466
- print("PASSED - All relationship ID references are valid")
467
- return True
468
-
469
- def _get_expected_relationship_type(self, element_name):
470
- elem_lower = element_name.lower()
471
-
472
- if elem_lower in self.ELEMENT_RELATIONSHIP_TYPES:
473
- return self.ELEMENT_RELATIONSHIP_TYPES[elem_lower]
474
-
475
- if elem_lower.endswith("id") and len(elem_lower) > 2:
476
- prefix = elem_lower[:-2]
477
- if prefix.endswith("master"):
478
- return prefix.lower()
479
- elif prefix.endswith("layout"):
480
- return prefix.lower()
481
- else:
482
- if prefix == "sld":
483
- return "slide"
484
- return prefix.lower()
485
-
486
- if elem_lower.endswith("reference") and len(elem_lower) > 9:
487
- prefix = elem_lower[:-9]
488
- return prefix.lower()
489
-
490
- return None
491
-
492
- def validate_content_types(self):
493
- errors = []
494
-
495
- content_types_file = self.unpacked_dir / "[Content_Types].xml"
496
- if not content_types_file.exists():
497
- print("FAILED - [Content_Types].xml file not found")
498
- return False
499
-
500
- try:
501
- root = lxml.etree.parse(str(content_types_file)).getroot()
502
- declared_parts = set()
503
- declared_extensions = set()
504
-
505
- for override in root.findall(
506
- f".//{{{self.CONTENT_TYPES_NAMESPACE}}}Override"
507
- ):
508
- part_name = override.get("PartName")
509
- if part_name is not None:
510
- declared_parts.add(part_name.lstrip("/"))
511
-
512
- for default in root.findall(
513
- f".//{{{self.CONTENT_TYPES_NAMESPACE}}}Default"
514
- ):
515
- extension = default.get("Extension")
516
- if extension is not None:
517
- declared_extensions.add(extension.lower())
518
-
519
- declarable_roots = {
520
- "sld",
521
- "sldLayout",
522
- "sldMaster",
523
- "presentation",
524
- "document",
525
- "workbook",
526
- "worksheet",
527
- "theme",
528
- }
529
-
530
- media_extensions = {
531
- "png": "image/png",
532
- "jpg": "image/jpeg",
533
- "jpeg": "image/jpeg",
534
- "gif": "image/gif",
535
- "bmp": "image/bmp",
536
- "tiff": "image/tiff",
537
- "wmf": "image/x-wmf",
538
- "emf": "image/x-emf",
539
- }
540
-
541
- all_files = list(self.unpacked_dir.rglob("*"))
542
- all_files = [f for f in all_files if f.is_file()]
543
-
544
- for xml_file in self.xml_files:
545
- path_str = str(xml_file.relative_to(self.unpacked_dir)).replace(
546
- "\\", "/"
547
- )
548
-
549
- if any(
550
- skip in path_str
551
- for skip in [".rels", "[Content_Types]", "docProps/", "_rels/"]
552
- ):
553
- continue
554
-
555
- try:
556
- root_tag = lxml.etree.parse(str(xml_file)).getroot().tag
557
- root_name = root_tag.split("}")[-1] if "}" in root_tag else root_tag
558
-
559
- if root_name in declarable_roots and path_str not in declared_parts:
560
- errors.append(
561
- f" {path_str}: File with <{root_name}> root not declared in [Content_Types].xml"
562
- )
563
-
564
- except Exception:
565
- continue
566
-
567
- for file_path in all_files:
568
- if file_path.suffix.lower() in {".xml", ".rels"}:
569
- continue
570
- if file_path.name == "[Content_Types].xml":
571
- continue
572
- if "_rels" in file_path.parts or "docProps" in file_path.parts:
573
- continue
574
-
575
- extension = file_path.suffix.lstrip(".").lower()
576
- if extension and extension not in declared_extensions:
577
- if extension in media_extensions:
578
- relative_path = file_path.relative_to(self.unpacked_dir)
579
- errors.append(
580
- f' {relative_path}: File with extension \'{extension}\' not declared in [Content_Types].xml - should add: <Default Extension="{extension}" ContentType="{media_extensions[extension]}"/>'
581
- )
582
-
583
- except Exception as e:
584
- errors.append(f" Error parsing [Content_Types].xml: {e}")
585
-
586
- if errors:
587
- print(f"FAILED - Found {len(errors)} content type declaration errors:")
588
- for error in errors:
589
- print(error)
590
- return False
591
- else:
592
- if self.verbose:
593
- print(
594
- "PASSED - All content files are properly declared in [Content_Types].xml"
595
- )
596
- return True
597
-
598
- def validate_file_against_xsd(self, xml_file, verbose=False):
599
- xml_file = Path(xml_file).resolve()
600
- unpacked_dir = self.unpacked_dir.resolve()
601
-
602
- is_valid, current_errors = self._validate_single_file_xsd(
603
- xml_file, unpacked_dir
604
- )
605
-
606
- if is_valid is None:
607
- return None, set()
608
- elif is_valid:
609
- return True, set()
610
-
611
- original_errors = self._get_original_file_errors(xml_file)
612
-
613
- assert current_errors is not None
614
- new_errors = current_errors - original_errors
615
-
616
- new_errors = {
617
- e for e in new_errors
618
- if not any(pattern in e for pattern in self.IGNORED_VALIDATION_ERRORS)
619
- }
620
-
621
- if new_errors:
622
- if verbose:
623
- relative_path = xml_file.relative_to(unpacked_dir)
624
- print(f"FAILED - {relative_path}: {len(new_errors)} new error(s)")
625
- for error in list(new_errors)[:3]:
626
- truncated = error[:250] + "..." if len(error) > 250 else error
627
- print(f" - {truncated}")
628
- return False, new_errors
629
- else:
630
- if verbose:
631
- print(
632
- f"PASSED - No new errors (original had {len(current_errors)} errors)"
633
- )
634
- return True, set()
635
-
636
- def validate_against_xsd(self):
637
- new_errors = []
638
- original_error_count = 0
639
- valid_count = 0
640
- skipped_count = 0
641
-
642
- for xml_file in self.xml_files:
643
- relative_path = str(xml_file.relative_to(self.unpacked_dir))
644
- is_valid, new_file_errors = self.validate_file_against_xsd(
645
- xml_file, verbose=False
646
- )
647
-
648
- if is_valid is None:
649
- skipped_count += 1
650
- continue
651
- elif is_valid and not new_file_errors:
652
- valid_count += 1
653
- continue
654
- elif is_valid:
655
- original_error_count += 1
656
- valid_count += 1
657
- continue
658
-
659
- new_errors.append(f" {relative_path}: {len(new_file_errors)} new error(s)")
660
- for error in list(new_file_errors)[:3]:
661
- new_errors.append(
662
- f" - {error[:250]}..." if len(error) > 250 else f" - {error}"
663
- )
664
-
665
- if self.verbose:
666
- print(f"Validated {len(self.xml_files)} files:")
667
- print(f" - Valid: {valid_count}")
668
- print(f" - Skipped (no schema): {skipped_count}")
669
- if original_error_count:
670
- print(f" - With original errors (ignored): {original_error_count}")
671
- print(
672
- f" - With NEW errors: {len(new_errors) > 0 and len([e for e in new_errors if not e.startswith(' ')]) or 0}"
673
- )
674
-
675
- if new_errors:
676
- print("\nFAILED - Found NEW validation errors:")
677
- for error in new_errors:
678
- print(error)
679
- return False
680
- else:
681
- if self.verbose:
682
- print("\nPASSED - No new XSD validation errors introduced")
683
- return True
684
-
685
- def _get_schema_path(self, xml_file):
686
- if xml_file.name in self.SCHEMA_MAPPINGS:
687
- return self.schemas_dir / self.SCHEMA_MAPPINGS[xml_file.name]
688
-
689
- if xml_file.suffix == ".rels":
690
- return self.schemas_dir / self.SCHEMA_MAPPINGS[".rels"]
691
-
692
- if "charts/" in str(xml_file) and xml_file.name.startswith("chart"):
693
- return self.schemas_dir / self.SCHEMA_MAPPINGS["chart"]
694
-
695
- if "theme/" in str(xml_file) and xml_file.name.startswith("theme"):
696
- return self.schemas_dir / self.SCHEMA_MAPPINGS["theme"]
697
-
698
- if xml_file.parent.name in self.MAIN_CONTENT_FOLDERS:
699
- return self.schemas_dir / self.SCHEMA_MAPPINGS[xml_file.parent.name]
700
-
701
- return None
702
-
703
def _clean_ignorable_namespaces(self, xml_doc):
    """Return a copy of ``xml_doc`` without content from unknown namespaces.

    The document is copied by serialising and re-parsing it. Namespaced
    attributes whose namespace is not in ``OOXML_NAMESPACES`` are deleted,
    then ``_remove_ignorable_elements`` drops elements from such
    namespaces. The input document is left untouched.
    """
    serialized = lxml.etree.tostring(xml_doc, encoding="unicode")
    root = lxml.etree.fromstring(serialized)

    for node in root.iter():
        # Collect first: the attribute map must not change while iterated.
        foreign = [
            key
            for key in node.attrib
            if "{" in key and key.split("}")[0][1:] not in self.OOXML_NAMESPACES
        ]
        for key in foreign:
            del node.attrib[key]

    self._remove_ignorable_elements(root)

    return lxml.etree.ElementTree(root)
722
-
723
- def _remove_ignorable_elements(self, root):
724
- elements_to_remove = []
725
-
726
- for elem in list(root):
727
- if not hasattr(elem, "tag") or callable(elem.tag):
728
- continue
729
-
730
- tag_str = str(elem.tag)
731
- if tag_str.startswith("{"):
732
- ns = tag_str.split("}")[0][1:]
733
- if ns not in self.OOXML_NAMESPACES:
734
- elements_to_remove.append(elem)
735
- continue
736
-
737
- self._remove_ignorable_elements(elem)
738
-
739
- for elem in elements_to_remove:
740
- root.remove(elem)
741
-
742
- def _preprocess_for_mc_ignorable(self, xml_doc):
743
- root = xml_doc.getroot()
744
-
745
- if f"{{{self.MC_NAMESPACE}}}Ignorable" in root.attrib:
746
- del root.attrib[f"{{{self.MC_NAMESPACE}}}Ignorable"]
747
-
748
- return xml_doc
749
-
750
- def _validate_single_file_xsd(self, xml_file, base_path):
751
- schema_path = self._get_schema_path(xml_file)
752
- if not schema_path:
753
- return None, None
754
-
755
- try:
756
- with open(schema_path, "rb") as xsd_file:
757
- parser = lxml.etree.XMLParser()
758
- xsd_doc = lxml.etree.parse(
759
- xsd_file, parser=parser, base_url=str(schema_path)
760
- )
761
- schema = lxml.etree.XMLSchema(xsd_doc)
762
-
763
- with open(xml_file, "r") as f:
764
- xml_doc = lxml.etree.parse(f)
765
-
766
- xml_doc, _ = self._remove_template_tags_from_text_nodes(xml_doc)
767
- xml_doc = self._preprocess_for_mc_ignorable(xml_doc)
768
-
769
- relative_path = xml_file.relative_to(base_path)
770
- if (
771
- relative_path.parts
772
- and relative_path.parts[0] in self.MAIN_CONTENT_FOLDERS
773
- ):
774
- xml_doc = self._clean_ignorable_namespaces(xml_doc)
775
-
776
- if schema.validate(xml_doc):
777
- return True, set()
778
- else:
779
- errors = set()
780
- for error in schema.error_log:
781
- errors.add(error.message)
782
- return False, errors
783
-
784
- except Exception as e:
785
- return False, {str(e)}
786
-
787
- def _get_original_file_errors(self, xml_file):
788
- if self.original_file is None:
789
- return set()
790
-
791
- import tempfile
792
- import zipfile
793
-
794
- xml_file = Path(xml_file).resolve()
795
- unpacked_dir = self.unpacked_dir.resolve()
796
- relative_path = xml_file.relative_to(unpacked_dir)
797
-
798
- with tempfile.TemporaryDirectory() as temp_dir:
799
- temp_path = Path(temp_dir)
800
-
801
- with zipfile.ZipFile(self.original_file, "r") as zip_ref:
802
- zip_ref.extractall(temp_path)
803
-
804
- original_xml_file = temp_path / relative_path
805
-
806
- if not original_xml_file.exists():
807
- return set()
808
-
809
- is_valid, errors = self._validate_single_file_xsd(
810
- original_xml_file, temp_path
811
- )
812
- return errors if errors else set()
813
-
814
def _remove_template_tags_from_text_nodes(self, xml_doc):
    """Strip ``{{...}}`` template tags from a copy of the document.

    The document is copied by serialising and re-parsing it. For every
    element except those whose local name is ``t``, matches of the template
    pattern are deleted from the element's text and tail.

    Returns:
        A ``(tree, warnings)`` tuple: the cleaned copy and one warning
        string per template tag that was removed.
    """
    placeholder = re.compile(r"\{\{[^}]*\}\}")
    found = []

    def scrub(value, origin):
        # Empty or missing text is returned unchanged.
        if not value:
            return value
        hits = placeholder.findall(value)
        if not hits:
            return value
        found.extend(f"Found template tag in {origin}: {hit}" for hit in hits)
        return placeholder.sub("", value)

    serialized = lxml.etree.tostring(xml_doc, encoding="unicode")
    root = lxml.etree.fromstring(serialized)

    for node in root.iter():
        if not hasattr(node, "tag") or callable(node.tag):
            continue
        qualified = str(node.tag)
        # Elements named "t" keep their text and tail as they are.
        if qualified == "t" or qualified.endswith("}t"):
            continue

        node.text = scrub(node.text, "text content")
        node.tail = scrub(node.tail, "tail content")

    return lxml.etree.ElementTree(root), found
844
-
845
-
846
# Executing this file as a script is rejected with an error.
if __name__ == "__main__":
    raise RuntimeError("This module should not be run directly.")
1
+ """
2
+ Base validator with common validation logic for document files.
3
+ """
4
+
5
+ import re
6
+ from pathlib import Path
7
+
8
+ import defusedxml.minidom
9
+ import lxml.etree
10
+
11
+
12
+ class BaseSchemaValidator:
13
+
14
# Substrings of XSD error messages; validate_file_against_xsd drops any new
# error whose message contains one of them.
IGNORED_VALIDATION_ERRORS = [
    "hyphenationZone",
    "purl.org/dc/terms",
]

# Lowercased element local name -> (lowercased attribute local name, scope).
# validate_unique_ids checks "file" entries for duplicates within one file
# and "global" entries for duplicates across all files.
UNIQUE_ID_REQUIREMENTS = {
    "comment": ("id", "file"),
    "commentrangestart": ("id", "file"),
    "commentrangeend": ("id", "file"),
    "bookmarkstart": ("id", "file"),
    "bookmarkend": ("id", "file"),
    "sldid": ("id", "file"),
    "sldmasterid": ("id", "global"),
    "sldlayoutid": ("id", "global"),
    "cm": ("authorid", "file"),
    "sheet": ("sheetid", "file"),
    "definedname": ("id", "file"),
    "cxnsp": ("id", "file"),
    "sp": ("id", "file"),
    "pic": ("id", "file"),
    "grpsp": ("id", "file"),
}

# Lowercased local names of ancestors; elements nested under one of these
# are skipped by validate_unique_ids.
EXCLUDED_ID_CONTAINERS = {
    "sectionlst",
}

# Lowercased element name -> expected relationship type. While this is
# empty, validate_all_relationship_ids skips its type check.
# NOTE(review): presumably meant to be overridden by subclasses — confirm.
ELEMENT_RELATIONSHIP_TYPES = {}

# Schema file, relative to self.schemas_dir, keyed by what
# _get_schema_path matches on: content folder name, exact file name, the
# ".rels" suffix, or the "chart"/"theme" category.
# NOTE(review): "fouth-edition" is part of a file path; it presumably has
# to match the directory name on disk — confirm before correcting it.
SCHEMA_MAPPINGS = {
    "word": "ISO-IEC29500-4_2016/wml.xsd",
    "ppt": "ISO-IEC29500-4_2016/pml.xsd",
    "xl": "ISO-IEC29500-4_2016/sml.xsd",
    "[Content_Types].xml": "ecma/fouth-edition/opc-contentTypes.xsd",
    "app.xml": "ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd",
    "core.xml": "ecma/fouth-edition/opc-coreProperties.xsd",
    "custom.xml": "ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd",
    ".rels": "ecma/fouth-edition/opc-relationships.xsd",
    "people.xml": "microsoft/wml-2012.xsd",
    "commentsIds.xml": "microsoft/wml-cid-2016.xsd",
    "commentsExtensible.xml": "microsoft/wml-cex-2018.xsd",
    "commentsExtended.xml": "microsoft/wml-2012.xsd",
    "chart": "ISO-IEC29500-4_2016/dml-chart.xsd",
    "theme": "ISO-IEC29500-4_2016/dml-main.xsd",
    "drawing": "ISO-IEC29500-4_2016/dml-main.xsd",
}

# Namespace URIs used when building qualified names and XPath queries.
MC_NAMESPACE = "http://schemas.openxmlformats.org/markup-compatibility/2006"
XML_NAMESPACE = "http://www.w3.org/XML/1998/namespace"

PACKAGE_RELATIONSHIPS_NAMESPACE = (
    "http://schemas.openxmlformats.org/package/2006/relationships"
)
OFFICE_RELATIONSHIPS_NAMESPACE = (
    "http://schemas.openxmlformats.org/officeDocument/2006/relationships"
)
CONTENT_TYPES_NAMESPACE = (
    "http://schemas.openxmlformats.org/package/2006/content-types"
)

# Top-level package folders: files directly inside one use that folder's
# schema, and files anywhere under one are cleaned of unknown namespaces
# before validation.
MAIN_CONTENT_FOLDERS = {"word", "ppt", "xl"}

# Namespaces kept by _clean_ignorable_namespaces and
# _remove_ignorable_elements; attributes and elements in any other
# namespace are removed before XSD validation.
OOXML_NAMESPACES = {
    "http://schemas.openxmlformats.org/officeDocument/2006/math",
    "http://schemas.openxmlformats.org/officeDocument/2006/relationships",
    "http://schemas.openxmlformats.org/schemaLibrary/2006/main",
    "http://schemas.openxmlformats.org/drawingml/2006/main",
    "http://schemas.openxmlformats.org/drawingml/2006/chart",
    "http://schemas.openxmlformats.org/drawingml/2006/chartDrawing",
    "http://schemas.openxmlformats.org/drawingml/2006/diagram",
    "http://schemas.openxmlformats.org/drawingml/2006/picture",
    "http://schemas.openxmlformats.org/drawingml/2006/spreadsheetDrawing",
    "http://schemas.openxmlformats.org/drawingml/2006/wordprocessingDrawing",
    "http://schemas.openxmlformats.org/wordprocessingml/2006/main",
    "http://schemas.openxmlformats.org/presentationml/2006/main",
    "http://schemas.openxmlformats.org/spreadsheetml/2006/main",
    "http://schemas.openxmlformats.org/officeDocument/2006/sharedTypes",
    "http://www.w3.org/XML/1998/namespace",
}
93
+
94
+ def __init__(self, unpacked_dir, original_file=None, verbose=False):
95
+ self.unpacked_dir = Path(unpacked_dir).resolve()
96
+ self.original_file = Path(original_file) if original_file else None
97
+ self.verbose = verbose
98
+
99
+ self.schemas_dir = Path(__file__).parent.parent / "schemas"
100
+
101
+ patterns = ["*.xml", "*.rels"]
102
+ self.xml_files = [
103
+ f for pattern in patterns for f in self.unpacked_dir.rglob(pattern)
104
+ ]
105
+
106
+ if not self.xml_files:
107
+ print(f"Warning: No XML files found in {self.unpacked_dir}")
108
+
109
+ def validate(self):
110
+ raise NotImplementedError("Subclasses must implement the validate method")
111
+
112
+ def repair(self) -> int:
113
+ return self.repair_whitespace_preservation()
114
+
115
+ def repair_whitespace_preservation(self) -> int:
116
+ repairs = 0
117
+
118
+ for xml_file in self.xml_files:
119
+ try:
120
+ content = xml_file.read_text(encoding="utf-8")
121
+ dom = defusedxml.minidom.parseString(content)
122
+ modified = False
123
+
124
+ for elem in dom.getElementsByTagName("*"):
125
+ if elem.tagName.endswith(":t") and elem.firstChild:
126
+ text = elem.firstChild.nodeValue
127
+ if text and (text.startswith((' ', '\t')) or text.endswith((' ', '\t'))):
128
+ if elem.getAttribute("xml:space") != "preserve":
129
+ elem.setAttribute("xml:space", "preserve")
130
+ text_preview = repr(text[:30]) + "..." if len(text) > 30 else repr(text)
131
+ print(f" Repaired: {xml_file.name}: Added xml:space='preserve' to {elem.tagName}: {text_preview}")
132
+ repairs += 1
133
+ modified = True
134
+
135
+ if modified:
136
+ xml_file.write_bytes(dom.toxml(encoding="UTF-8"))
137
+
138
+ except Exception:
139
+ pass
140
+
141
+ return repairs
142
+
143
+ def validate_xml(self):
144
+ errors = []
145
+
146
+ for xml_file in self.xml_files:
147
+ try:
148
+ lxml.etree.parse(str(xml_file))
149
+ except lxml.etree.XMLSyntaxError as e:
150
+ errors.append(
151
+ f" {xml_file.relative_to(self.unpacked_dir)}: "
152
+ f"Line {e.lineno}: {e.msg}"
153
+ )
154
+ except Exception as e:
155
+ errors.append(
156
+ f" {xml_file.relative_to(self.unpacked_dir)}: "
157
+ f"Unexpected error: {str(e)}"
158
+ )
159
+
160
+ if errors:
161
+ print(f"FAILED - Found {len(errors)} XML violations:")
162
+ for error in errors:
163
+ print(error)
164
+ return False
165
+ else:
166
+ if self.verbose:
167
+ print("PASSED - All XML files are well-formed")
168
+ return True
169
+
170
+ def validate_namespaces(self):
171
+ errors = []
172
+
173
+ for xml_file in self.xml_files:
174
+ try:
175
+ root = lxml.etree.parse(str(xml_file)).getroot()
176
+ declared = set(root.nsmap.keys()) - {None}
177
+
178
+ for attr_val in [
179
+ v for k, v in root.attrib.items() if k.endswith("Ignorable")
180
+ ]:
181
+ undeclared = set(attr_val.split()) - declared
182
+ errors.extend(
183
+ f" {xml_file.relative_to(self.unpacked_dir)}: "
184
+ f"Namespace '{ns}' in Ignorable but not declared"
185
+ for ns in undeclared
186
+ )
187
+ except lxml.etree.XMLSyntaxError:
188
+ continue
189
+
190
+ if errors:
191
+ print(f"FAILED - {len(errors)} namespace issues:")
192
+ for error in errors:
193
+ print(error)
194
+ return False
195
+ if self.verbose:
196
+ print("PASSED - All namespace prefixes properly declared")
197
+ return True
198
+
199
+ def validate_unique_ids(self):
200
+ errors = []
201
+ global_ids = {}
202
+
203
+ for xml_file in self.xml_files:
204
+ try:
205
+ root = lxml.etree.parse(str(xml_file)).getroot()
206
+ file_ids = {}
207
+
208
+ mc_elements = root.xpath(
209
+ ".//mc:AlternateContent", namespaces={"mc": self.MC_NAMESPACE}
210
+ )
211
+ for elem in mc_elements:
212
+ elem.getparent().remove(elem)
213
+
214
+ for elem in root.iter():
215
+ tag = (
216
+ elem.tag.split("}")[-1].lower()
217
+ if "}" in elem.tag
218
+ else elem.tag.lower()
219
+ )
220
+
221
+ if tag in self.UNIQUE_ID_REQUIREMENTS:
222
+ in_excluded_container = any(
223
+ ancestor.tag.split("}")[-1].lower() in self.EXCLUDED_ID_CONTAINERS
224
+ for ancestor in elem.iterancestors()
225
+ )
226
+ if in_excluded_container:
227
+ continue
228
+
229
+ attr_name, scope = self.UNIQUE_ID_REQUIREMENTS[tag]
230
+
231
+ id_value = None
232
+ for attr, value in elem.attrib.items():
233
+ attr_local = (
234
+ attr.split("}")[-1].lower()
235
+ if "}" in attr
236
+ else attr.lower()
237
+ )
238
+ if attr_local == attr_name:
239
+ id_value = value
240
+ break
241
+
242
+ if id_value is not None:
243
+ if scope == "global":
244
+ if id_value in global_ids:
245
+ prev_file, prev_line, prev_tag = global_ids[
246
+ id_value
247
+ ]
248
+ errors.append(
249
+ f" {xml_file.relative_to(self.unpacked_dir)}: "
250
+ f"Line {elem.sourceline}: Global ID '{id_value}' in <{tag}> "
251
+ f"already used in {prev_file} at line {prev_line} in <{prev_tag}>"
252
+ )
253
+ else:
254
+ global_ids[id_value] = (
255
+ xml_file.relative_to(self.unpacked_dir),
256
+ elem.sourceline,
257
+ tag,
258
+ )
259
+ elif scope == "file":
260
+ key = (tag, attr_name)
261
+ if key not in file_ids:
262
+ file_ids[key] = {}
263
+
264
+ if id_value in file_ids[key]:
265
+ prev_line = file_ids[key][id_value]
266
+ errors.append(
267
+ f" {xml_file.relative_to(self.unpacked_dir)}: "
268
+ f"Line {elem.sourceline}: Duplicate {attr_name}='{id_value}' in <{tag}> "
269
+ f"(first occurrence at line {prev_line})"
270
+ )
271
+ else:
272
+ file_ids[key][id_value] = elem.sourceline
273
+
274
+ except (lxml.etree.XMLSyntaxError, Exception) as e:
275
+ errors.append(
276
+ f" {xml_file.relative_to(self.unpacked_dir)}: Error: {e}"
277
+ )
278
+
279
+ if errors:
280
+ print(f"FAILED - Found {len(errors)} ID uniqueness violations:")
281
+ for error in errors:
282
+ print(error)
283
+ return False
284
+ else:
285
+ if self.verbose:
286
+ print("PASSED - All required IDs are unique")
287
+ return True
288
+
289
+ def validate_file_references(self):
290
+ errors = []
291
+
292
+ rels_files = list(self.unpacked_dir.rglob("*.rels"))
293
+
294
+ if not rels_files:
295
+ if self.verbose:
296
+ print("PASSED - No .rels files found")
297
+ return True
298
+
299
+ all_files = []
300
+ for file_path in self.unpacked_dir.rglob("*"):
301
+ if (
302
+ file_path.is_file()
303
+ and file_path.name != "[Content_Types].xml"
304
+ and not file_path.name.endswith(".rels")
305
+ ):
306
+ all_files.append(file_path.resolve())
307
+
308
+ all_referenced_files = set()
309
+
310
+ if self.verbose:
311
+ print(
312
+ f"Found {len(rels_files)} .rels files and {len(all_files)} target files"
313
+ )
314
+
315
+ for rels_file in rels_files:
316
+ try:
317
+ rels_root = lxml.etree.parse(str(rels_file)).getroot()
318
+
319
+ rels_dir = rels_file.parent
320
+
321
+ referenced_files = set()
322
+ broken_refs = []
323
+
324
+ for rel in rels_root.findall(
325
+ ".//ns:Relationship",
326
+ namespaces={"ns": self.PACKAGE_RELATIONSHIPS_NAMESPACE},
327
+ ):
328
+ target = rel.get("Target")
329
+ if target and not target.startswith(
330
+ ("http", "mailto:")
331
+ ):
332
+ if target.startswith("/"):
333
+ target_path = self.unpacked_dir / target.lstrip("/")
334
+ elif rels_file.name == ".rels":
335
+ target_path = self.unpacked_dir / target
336
+ else:
337
+ base_dir = rels_dir.parent
338
+ target_path = base_dir / target
339
+
340
+ try:
341
+ target_path = target_path.resolve()
342
+ if target_path.exists() and target_path.is_file():
343
+ referenced_files.add(target_path)
344
+ all_referenced_files.add(target_path)
345
+ else:
346
+ broken_refs.append((target, rel.sourceline))
347
+ except (OSError, ValueError):
348
+ broken_refs.append((target, rel.sourceline))
349
+
350
+ if broken_refs:
351
+ rel_path = rels_file.relative_to(self.unpacked_dir)
352
+ for broken_ref, line_num in broken_refs:
353
+ errors.append(
354
+ f" {rel_path}: Line {line_num}: Broken reference to {broken_ref}"
355
+ )
356
+
357
+ except Exception as e:
358
+ rel_path = rels_file.relative_to(self.unpacked_dir)
359
+ errors.append(f" Error parsing {rel_path}: {e}")
360
+
361
+ unreferenced_files = set(all_files) - all_referenced_files
362
+
363
+ if unreferenced_files:
364
+ for unref_file in sorted(unreferenced_files):
365
+ unref_rel_path = unref_file.relative_to(self.unpacked_dir)
366
+ errors.append(f" Unreferenced file: {unref_rel_path}")
367
+
368
+ if errors:
369
+ print(f"FAILED - Found {len(errors)} relationship validation errors:")
370
+ for error in errors:
371
+ print(error)
372
+ print(
373
+ "CRITICAL: These errors will cause the document to appear corrupt. "
374
+ + "Broken references MUST be fixed, "
375
+ + "and unreferenced files MUST be referenced or removed."
376
+ )
377
+ return False
378
+ else:
379
+ if self.verbose:
380
+ print(
381
+ "PASSED - All references are valid and all files are properly referenced"
382
+ )
383
+ return True
384
+
385
def validate_all_relationship_ids(self):
    """Check r:id, r:embed and r:link attributes against the part's .rels.

    For each non-.rels file that has a ``_rels/<name>.rels`` companion, the
    relationship IDs are collected (duplicates are reported) and every
    ``id``/``embed``/``link`` attribute in the office relationships
    namespace must name one of them. When ``ELEMENT_RELATIONSHIP_TYPES`` is
    non-empty, ``r:id`` references are also checked against the
    relationship type expected for the element.

    Returns:
        ``True`` when no problem is found, ``False`` otherwise.
    """
    import lxml.etree

    problems = []
    relationship_query = f".//{{{self.PACKAGE_RELATIONSHIPS_NAMESPACE}}}Relationship"
    office_ns = self.OFFICE_RELATIONSHIPS_NAMESPACE

    for part in self.xml_files:
        if part.suffix == ".rels":
            continue

        rels_file = part.parent / "_rels" / f"{part.name}.rels"
        if not rels_file.exists():
            continue

        try:
            # Relationship Id -> last path segment of its Type.
            types_by_rid = {}
            rels_root = lxml.etree.parse(str(rels_file)).getroot()
            for rel in rels_root.findall(relationship_query):
                rid = rel.get("Id")
                if not rid:
                    continue
                if rid in types_by_rid:
                    rels_rel_path = rels_file.relative_to(self.unpacked_dir)
                    problems.append(
                        f" {rels_rel_path}: Line {rel.sourceline}: "
                        f"Duplicate relationship ID '{rid}' (IDs must be unique)"
                    )
                types_by_rid[rid] = rel.get("Type", "").rsplit("/", 1)[-1]

            part_root = lxml.etree.parse(str(part)).getroot()
            for elem in part_root.iter():
                for attr_name in ("id", "embed", "link"):
                    rid_attr = elem.get(f"{{{office_ns}}}{attr_name}")
                    if not rid_attr:
                        continue

                    xml_rel_path = part.relative_to(self.unpacked_dir)
                    elem_name = elem.tag.split("}")[-1]

                    if rid_attr not in types_by_rid:
                        shown_ids = ", ".join(sorted(types_by_rid)[:5])
                        more = "..." if len(types_by_rid) > 5 else ""
                        problems.append(
                            f" {xml_rel_path}: Line {elem.sourceline}: "
                            f"<{elem_name}> r:{attr_name} references non-existent relationship '{rid_attr}' "
                            f"(valid IDs: {shown_ids}{more})"
                        )
                        continue

                    if attr_name != "id" or not self.ELEMENT_RELATIONSHIP_TYPES:
                        continue

                    expected_type = self._get_expected_relationship_type(elem_name)
                    if not expected_type:
                        continue

                    actual_type = types_by_rid[rid_attr]
                    if expected_type not in actual_type.lower():
                        problems.append(
                            f" {xml_rel_path}: Line {elem.sourceline}: "
                            f"<{elem_name}> references '{rid_attr}' which points to '{actual_type}' "
                            f"but should point to a '{expected_type}' relationship"
                        )

        except Exception as e:
            xml_rel_path = part.relative_to(self.unpacked_dir)
            problems.append(f" Error processing {xml_rel_path}: {e}")

    if problems:
        print(f"FAILED - Found {len(problems)} relationship ID reference errors:")
        for line in problems:
            print(line)
        print("\nThese ID mismatches will cause the document to appear corrupt!")
        return False

    if self.verbose:
        print("PASSED - All relationship ID references are valid")
    return True
468
+
469
+ def _get_expected_relationship_type(self, element_name):
470
+ elem_lower = element_name.lower()
471
+
472
+ if elem_lower in self.ELEMENT_RELATIONSHIP_TYPES:
473
+ return self.ELEMENT_RELATIONSHIP_TYPES[elem_lower]
474
+
475
+ if elem_lower.endswith("id") and len(elem_lower) > 2:
476
+ prefix = elem_lower[:-2]
477
+ if prefix.endswith("master"):
478
+ return prefix.lower()
479
+ elif prefix.endswith("layout"):
480
+ return prefix.lower()
481
+ else:
482
+ if prefix == "sld":
483
+ return "slide"
484
+ return prefix.lower()
485
+
486
+ if elem_lower.endswith("reference") and len(elem_lower) > 9:
487
+ prefix = elem_lower[:-9]
488
+ return prefix.lower()
489
+
490
+ return None
491
+
492
+ def validate_content_types(self):
493
+ errors = []
494
+
495
+ content_types_file = self.unpacked_dir / "[Content_Types].xml"
496
+ if not content_types_file.exists():
497
+ print("FAILED - [Content_Types].xml file not found")
498
+ return False
499
+
500
+ try:
501
+ root = lxml.etree.parse(str(content_types_file)).getroot()
502
+ declared_parts = set()
503
+ declared_extensions = set()
504
+
505
+ for override in root.findall(
506
+ f".//{{{self.CONTENT_TYPES_NAMESPACE}}}Override"
507
+ ):
508
+ part_name = override.get("PartName")
509
+ if part_name is not None:
510
+ declared_parts.add(part_name.lstrip("/"))
511
+
512
+ for default in root.findall(
513
+ f".//{{{self.CONTENT_TYPES_NAMESPACE}}}Default"
514
+ ):
515
+ extension = default.get("Extension")
516
+ if extension is not None:
517
+ declared_extensions.add(extension.lower())
518
+
519
+ declarable_roots = {
520
+ "sld",
521
+ "sldLayout",
522
+ "sldMaster",
523
+ "presentation",
524
+ "document",
525
+ "workbook",
526
+ "worksheet",
527
+ "theme",
528
+ }
529
+
530
+ media_extensions = {
531
+ "png": "image/png",
532
+ "jpg": "image/jpeg",
533
+ "jpeg": "image/jpeg",
534
+ "gif": "image/gif",
535
+ "bmp": "image/bmp",
536
+ "tiff": "image/tiff",
537
+ "wmf": "image/x-wmf",
538
+ "emf": "image/x-emf",
539
+ }
540
+
541
+ all_files = list(self.unpacked_dir.rglob("*"))
542
+ all_files = [f for f in all_files if f.is_file()]
543
+
544
+ for xml_file in self.xml_files:
545
+ path_str = str(xml_file.relative_to(self.unpacked_dir)).replace(
546
+ "\\", "/"
547
+ )
548
+
549
+ if any(
550
+ skip in path_str
551
+ for skip in [".rels", "[Content_Types]", "docProps/", "_rels/"]
552
+ ):
553
+ continue
554
+
555
+ try:
556
+ root_tag = lxml.etree.parse(str(xml_file)).getroot().tag
557
+ root_name = root_tag.split("}")[-1] if "}" in root_tag else root_tag
558
+
559
+ if root_name in declarable_roots and path_str not in declared_parts:
560
+ errors.append(
561
+ f" {path_str}: File with <{root_name}> root not declared in [Content_Types].xml"
562
+ )
563
+
564
+ except Exception:
565
+ continue
566
+
567
+ for file_path in all_files:
568
+ if file_path.suffix.lower() in {".xml", ".rels"}:
569
+ continue
570
+ if file_path.name == "[Content_Types].xml":
571
+ continue
572
+ if "_rels" in file_path.parts or "docProps" in file_path.parts:
573
+ continue
574
+
575
+ extension = file_path.suffix.lstrip(".").lower()
576
+ if extension and extension not in declared_extensions:
577
+ if extension in media_extensions:
578
+ relative_path = file_path.relative_to(self.unpacked_dir)
579
+ errors.append(
580
+ f' {relative_path}: File with extension \'{extension}\' not declared in [Content_Types].xml - should add: <Default Extension="{extension}" ContentType="{media_extensions[extension]}"/>'
581
+ )
582
+
583
+ except Exception as e:
584
+ errors.append(f" Error parsing [Content_Types].xml: {e}")
585
+
586
+ if errors:
587
+ print(f"FAILED - Found {len(errors)} content type declaration errors:")
588
+ for error in errors:
589
+ print(error)
590
+ return False
591
+ else:
592
+ if self.verbose:
593
+ print(
594
+ "PASSED - All content files are properly declared in [Content_Types].xml"
595
+ )
596
+ return True
597
+
598
+ def validate_file_against_xsd(self, xml_file, verbose=False):
599
+ xml_file = Path(xml_file).resolve()
600
+ unpacked_dir = self.unpacked_dir.resolve()
601
+
602
+ is_valid, current_errors = self._validate_single_file_xsd(
603
+ xml_file, unpacked_dir
604
+ )
605
+
606
+ if is_valid is None:
607
+ return None, set()
608
+ elif is_valid:
609
+ return True, set()
610
+
611
+ original_errors = self._get_original_file_errors(xml_file)
612
+
613
+ assert current_errors is not None
614
+ new_errors = current_errors - original_errors
615
+
616
+ new_errors = {
617
+ e for e in new_errors
618
+ if not any(pattern in e for pattern in self.IGNORED_VALIDATION_ERRORS)
619
+ }
620
+
621
+ if new_errors:
622
+ if verbose:
623
+ relative_path = xml_file.relative_to(unpacked_dir)
624
+ print(f"FAILED - {relative_path}: {len(new_errors)} new error(s)")
625
+ for error in list(new_errors)[:3]:
626
+ truncated = error[:250] + "..." if len(error) > 250 else error
627
+ print(f" - {truncated}")
628
+ return False, new_errors
629
+ else:
630
+ if verbose:
631
+ print(
632
+ f"PASSED - No new errors (original had {len(current_errors)} errors)"
633
+ )
634
+ return True, set()
635
+
636
+ def validate_against_xsd(self):
637
+ new_errors = []
638
+ original_error_count = 0
639
+ valid_count = 0
640
+ skipped_count = 0
641
+
642
+ for xml_file in self.xml_files:
643
+ relative_path = str(xml_file.relative_to(self.unpacked_dir))
644
+ is_valid, new_file_errors = self.validate_file_against_xsd(
645
+ xml_file, verbose=False
646
+ )
647
+
648
+ if is_valid is None:
649
+ skipped_count += 1
650
+ continue
651
+ elif is_valid and not new_file_errors:
652
+ valid_count += 1
653
+ continue
654
+ elif is_valid:
655
+ original_error_count += 1
656
+ valid_count += 1
657
+ continue
658
+
659
+ new_errors.append(f" {relative_path}: {len(new_file_errors)} new error(s)")
660
+ for error in list(new_file_errors)[:3]:
661
+ new_errors.append(
662
+ f" - {error[:250]}..." if len(error) > 250 else f" - {error}"
663
+ )
664
+
665
+ if self.verbose:
666
+ print(f"Validated {len(self.xml_files)} files:")
667
+ print(f" - Valid: {valid_count}")
668
+ print(f" - Skipped (no schema): {skipped_count}")
669
+ if original_error_count:
670
+ print(f" - With original errors (ignored): {original_error_count}")
671
+ print(
672
+ f" - With NEW errors: {len(new_errors) > 0 and len([e for e in new_errors if not e.startswith(' ')]) or 0}"
673
+ )
674
+
675
+ if new_errors:
676
+ print("\nFAILED - Found NEW validation errors:")
677
+ for error in new_errors:
678
+ print(error)
679
+ return False
680
+ else:
681
+ if self.verbose:
682
+ print("\nPASSED - No new XSD validation errors introduced")
683
+ return True
684
+
685
+ def _get_schema_path(self, xml_file):
686
+ if xml_file.name in self.SCHEMA_MAPPINGS:
687
+ return self.schemas_dir / self.SCHEMA_MAPPINGS[xml_file.name]
688
+
689
+ if xml_file.suffix == ".rels":
690
+ return self.schemas_dir / self.SCHEMA_MAPPINGS[".rels"]
691
+
692
+ if "charts/" in str(xml_file) and xml_file.name.startswith("chart"):
693
+ return self.schemas_dir / self.SCHEMA_MAPPINGS["chart"]
694
+
695
+ if "theme/" in str(xml_file) and xml_file.name.startswith("theme"):
696
+ return self.schemas_dir / self.SCHEMA_MAPPINGS["theme"]
697
+
698
+ if xml_file.parent.name in self.MAIN_CONTENT_FOLDERS:
699
+ return self.schemas_dir / self.SCHEMA_MAPPINGS[xml_file.parent.name]
700
+
701
+ return None
702
+
703
def _clean_ignorable_namespaces(self, xml_doc):
    """Return a copy of ``xml_doc`` without non-OOXML attributes and elements.

    Namespaced attributes whose namespace is not in ``OOXML_NAMESPACES`` are
    deleted from every node, then ``_remove_ignorable_elements`` is run on
    the copy. The document passed in is not modified.

    Returns:
        A new ``lxml.etree.ElementTree`` wrapping the cleaned copy.
    """
    # Serialize and re-parse to obtain an independent tree to edit.
    serialized = lxml.etree.tostring(xml_doc, encoding="unicode")
    root_copy = lxml.etree.fromstring(serialized)

    for node in root_copy.iter():
        # Collect first, delete afterwards, so the attribute mapping is not
        # mutated while it is being iterated.
        foreign_attrs = [
            name
            for name in node.attrib
            if "{" in name
            and name.split("}")[0][1:] not in self.OOXML_NAMESPACES
        ]
        for name in foreign_attrs:
            del node.attrib[name]

    self._remove_ignorable_elements(root_copy)

    return lxml.etree.ElementTree(root_copy)
722
+
723
+ def _remove_ignorable_elements(self, root):
724
+ elements_to_remove = []
725
+
726
+ for elem in list(root):
727
+ if not hasattr(elem, "tag") or callable(elem.tag):
728
+ continue
729
+
730
+ tag_str = str(elem.tag)
731
+ if tag_str.startswith("{"):
732
+ ns = tag_str.split("}")[0][1:]
733
+ if ns not in self.OOXML_NAMESPACES:
734
+ elements_to_remove.append(elem)
735
+ continue
736
+
737
+ self._remove_ignorable_elements(elem)
738
+
739
+ for elem in elements_to_remove:
740
+ root.remove(elem)
741
+
742
+ def _preprocess_for_mc_ignorable(self, xml_doc):
743
+ root = xml_doc.getroot()
744
+
745
+ if f"{{{self.MC_NAMESPACE}}}Ignorable" in root.attrib:
746
+ del root.attrib[f"{{{self.MC_NAMESPACE}}}Ignorable"]
747
+
748
+ return xml_doc
749
+
750
+ def _validate_single_file_xsd(self, xml_file, base_path):
751
+ schema_path = self._get_schema_path(xml_file)
752
+ if not schema_path:
753
+ return None, None
754
+
755
+ try:
756
+ with open(schema_path, "rb") as xsd_file:
757
+ parser = lxml.etree.XMLParser()
758
+ xsd_doc = lxml.etree.parse(
759
+ xsd_file, parser=parser, base_url=str(schema_path)
760
+ )
761
+ schema = lxml.etree.XMLSchema(xsd_doc)
762
+
763
+ with open(xml_file, "r") as f:
764
+ xml_doc = lxml.etree.parse(f)
765
+
766
+ xml_doc, _ = self._remove_template_tags_from_text_nodes(xml_doc)
767
+ xml_doc = self._preprocess_for_mc_ignorable(xml_doc)
768
+
769
+ relative_path = xml_file.relative_to(base_path)
770
+ if (
771
+ relative_path.parts
772
+ and relative_path.parts[0] in self.MAIN_CONTENT_FOLDERS
773
+ ):
774
+ xml_doc = self._clean_ignorable_namespaces(xml_doc)
775
+
776
+ if schema.validate(xml_doc):
777
+ return True, set()
778
+ else:
779
+ errors = set()
780
+ for error in schema.error_log:
781
+ errors.add(error.message)
782
+ return False, errors
783
+
784
+ except Exception as e:
785
+ return False, {str(e)}
786
+
787
+ def _get_original_file_errors(self, xml_file):
788
+ if self.original_file is None:
789
+ return set()
790
+
791
+ import tempfile
792
+ import zipfile
793
+
794
+ xml_file = Path(xml_file).resolve()
795
+ unpacked_dir = self.unpacked_dir.resolve()
796
+ relative_path = xml_file.relative_to(unpacked_dir)
797
+
798
+ with tempfile.TemporaryDirectory() as temp_dir:
799
+ temp_path = Path(temp_dir)
800
+
801
+ with zipfile.ZipFile(self.original_file, "r") as zip_ref:
802
+ zip_ref.extractall(temp_path)
803
+
804
+ original_xml_file = temp_path / relative_path
805
+
806
+ if not original_xml_file.exists():
807
+ return set()
808
+
809
+ is_valid, errors = self._validate_single_file_xsd(
810
+ original_xml_file, temp_path
811
+ )
812
+ return errors if errors else set()
813
+
814
def _remove_template_tags_from_text_nodes(self, xml_doc):
    """Return a copy of ``xml_doc`` with ``{{...}}`` tags stripped, plus warnings.

    The text and tail of every element are scanned, except for elements
    whose tag is ``t`` (with or without a namespace), which are skipped
    entirely. The document passed in is not modified.

    Returns:
        tuple: ``(ElementTree, list[str])`` -- the cleaned copy and one
        warning message per template tag that was found.
    """
    tag_re = re.compile(r"\{\{[^}]*\}\}")
    warnings = []

    # Serialize and re-parse to obtain an independent tree to edit.
    root_copy = lxml.etree.fromstring(
        lxml.etree.tostring(xml_doc, encoding="unicode")
    )

    def strip_tags(value, label):
        # Empty or missing content is handed back unchanged.
        if not value:
            return value
        found = tag_re.findall(value)
        if not found:
            return value
        warnings.extend(
            f"Found template tag in {label}: {tag}" for tag in found
        )
        return tag_re.sub("", value)

    for node in root_copy.iter():
        if not hasattr(node, "tag") or callable(node.tag):
            continue
        name = str(node.tag)
        if name == "t" or name.endswith("}t"):
            continue

        node.text = strip_tags(node.text, "text content")
        node.tail = strip_tags(node.tail, "tail content")

    return lxml.etree.ElementTree(root_copy), warnings
844
+
845
+
846
if __name__ == "__main__":
    # This file is a library module only; executing it as a script is
    # rejected outright.
    _direct_run_message = "This module should not be run directly."
    raise RuntimeError(_direct_run_message)