@papert-code/papert-code 0.3.94 → 0.3.96
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +21 -0
- package/dist/chunks/{chunk-OIA427PZ.js → chunk-HSYOWGEB.js} +1 -1
- package/dist/chunks/{chunk-6ZOXSA5F.js → chunk-IK4ISYCE.js} +4 -4
- package/dist/chunks/{chunk-JATIVKZP.js → chunk-KBPFDUTA.js} +55 -10
- package/dist/chunks/{chunk-7T4OCWHU.js → chunk-TNDQXJLA.js} +1931 -787
- package/dist/chunks/{gemini-WYRXV2QC.js → gemini-MVJNXCFF.js} +20547 -16879
- package/dist/chunks/{openaiContentGenerator-EAVO6L3Y.js → openaiContentGenerator-GTG5MK5E.js} +2 -2
- package/dist/chunks/{papertContentGenerator-G4SBF3DR.js → papertContentGenerator-Q5TTXUE6.js} +3 -3
- package/dist/chunks/{server-N2U4FF55.js → server-6D3KYATG.js} +7 -1
- package/dist/cli.js +5 -4
- package/dist/sandbox-macos-permissive-proxied.sb +1 -1
- package/dist/sandbox-macos-restrictive-proxied.sb +1 -1
- package/dist/skills/algorithmic-art/SKILL.md +405 -0
- package/dist/skills/algorithmic-art/templates/generator_template.js +223 -0
- package/dist/skills/algorithmic-art/templates/viewer.html +599 -0
- package/dist/skills/brand-guidelines/SKILL.md +73 -0
- package/dist/skills/canvas-design/SKILL.md +130 -0
- package/dist/skills/canvas-design/canvas-fonts/ArsenalSC-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/ArsenalSC-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/BigShoulders-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/BigShoulders-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/BigShoulders-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Boldonse-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/Boldonse-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/BricolageGrotesque-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/BricolageGrotesque-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/BricolageGrotesque-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/CrimsonPro-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/CrimsonPro-Italic.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/CrimsonPro-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/CrimsonPro-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/DMMono-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/DMMono-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/EricaOne-OFL.txt +94 -0
- package/dist/skills/canvas-design/canvas-fonts/EricaOne-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/GeistMono-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/GeistMono-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/GeistMono-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Gloock-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/Gloock-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/IBMPlexMono-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/IBMPlexMono-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/IBMPlexMono-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/IBMPlexSerif-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/IBMPlexSerif-BoldItalic.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/IBMPlexSerif-Italic.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/IBMPlexSerif-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/InstrumentSans-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/InstrumentSans-BoldItalic.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/InstrumentSans-Italic.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/InstrumentSans-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/InstrumentSans-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/InstrumentSerif-Italic.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/InstrumentSerif-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Italiana-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/Italiana-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/JetBrainsMono-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/JetBrainsMono-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/JetBrainsMono-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Jura-Light.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Jura-Medium.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Jura-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/LibreBaskerville-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/LibreBaskerville-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Lora-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Lora-BoldItalic.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Lora-Italic.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Lora-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/Lora-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/NationalPark-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/NationalPark-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/NationalPark-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/NothingYouCouldDo-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/NothingYouCouldDo-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Outfit-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Outfit-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/Outfit-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/PixelifySans-Medium.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/PixelifySans-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/PoiretOne-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/PoiretOne-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/RedHatMono-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/RedHatMono-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/RedHatMono-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Silkscreen-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/Silkscreen-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/SmoochSans-Medium.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/SmoochSans-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/Tektur-Medium.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/Tektur-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/Tektur-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/WorkSans-Bold.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/WorkSans-BoldItalic.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/WorkSans-Italic.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/WorkSans-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/WorkSans-Regular.ttf +0 -0
- package/dist/skills/canvas-design/canvas-fonts/YoungSerif-OFL.txt +93 -0
- package/dist/skills/canvas-design/canvas-fonts/YoungSerif-Regular.ttf +0 -0
- package/dist/skills/doc-coauthoring/SKILL.md +375 -0
- package/dist/skills/docx/SKILL.md +481 -0
- package/dist/skills/docx/scripts/__init__.py +1 -0
- package/dist/skills/docx/scripts/accept_changes.py +135 -0
- package/dist/skills/docx/scripts/comment.py +318 -0
- package/dist/skills/docx/scripts/office/helpers/__init__.py +0 -0
- package/dist/skills/docx/scripts/office/helpers/merge_runs.py +199 -0
- package/dist/skills/docx/scripts/office/helpers/simplify_redlines.py +197 -0
- package/dist/skills/docx/scripts/office/pack.py +159 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +1499 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +146 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +1085 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +11 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +3081 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +23 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +185 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +287 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +1676 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +28 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +144 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +174 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +25 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +18 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +59 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +56 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +195 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +582 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +25 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +4439 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +570 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +509 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +12 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +108 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +96 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +3646 -0
- package/dist/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +116 -0
- package/dist/skills/docx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +42 -0
- package/dist/skills/docx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +50 -0
- package/dist/skills/docx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +49 -0
- package/dist/skills/docx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +33 -0
- package/dist/skills/docx/scripts/office/schemas/mce/mc.xsd +75 -0
- package/dist/skills/docx/scripts/office/schemas/microsoft/wml-2010.xsd +560 -0
- package/dist/skills/docx/scripts/office/schemas/microsoft/wml-2012.xsd +67 -0
- package/dist/skills/docx/scripts/office/schemas/microsoft/wml-2018.xsd +14 -0
- package/dist/skills/docx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +20 -0
- package/dist/skills/docx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +13 -0
- package/dist/skills/docx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +4 -0
- package/dist/skills/docx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +8 -0
- package/dist/skills/docx/scripts/office/soffice.py +183 -0
- package/dist/skills/docx/scripts/office/unpack.py +132 -0
- package/dist/skills/docx/scripts/office/validate.py +111 -0
- package/dist/skills/docx/scripts/office/validators/__init__.py +15 -0
- package/dist/skills/docx/scripts/office/validators/base.py +847 -0
- package/dist/skills/docx/scripts/office/validators/docx.py +446 -0
- package/dist/skills/docx/scripts/office/validators/pptx.py +275 -0
- package/dist/skills/docx/scripts/office/validators/redlining.py +247 -0
- package/dist/skills/docx/scripts/templates/comments.xml +3 -0
- package/dist/skills/docx/scripts/templates/commentsExtended.xml +3 -0
- package/dist/skills/docx/scripts/templates/commentsExtensible.xml +3 -0
- package/dist/skills/docx/scripts/templates/commentsIds.xml +3 -0
- package/dist/skills/docx/scripts/templates/people.xml +3 -0
- package/dist/skills/frontend-design/SKILL.md +42 -0
- package/dist/skills/internal-comms/SKILL.md +32 -0
- package/dist/skills/internal-comms/examples/3p-updates.md +47 -0
- package/dist/skills/internal-comms/examples/company-newsletter.md +65 -0
- package/dist/skills/internal-comms/examples/faq-answers.md +30 -0
- package/dist/skills/internal-comms/examples/general-comms.md +16 -0
- package/dist/skills/mcp-builder/SKILL.md +236 -0
- package/dist/skills/mcp-builder/reference/evaluation.md +602 -0
- package/dist/skills/mcp-builder/reference/mcp_best_practices.md +249 -0
- package/dist/skills/mcp-builder/reference/node_mcp_server.md +970 -0
- package/dist/skills/mcp-builder/reference/python_mcp_server.md +719 -0
- package/dist/skills/mcp-builder/scripts/connections.py +151 -0
- package/dist/skills/mcp-builder/scripts/evaluation.py +373 -0
- package/dist/skills/mcp-builder/scripts/example_evaluation.xml +22 -0
- package/dist/skills/mcp-builder/scripts/requirements.txt +2 -0
- package/dist/skills/papert-code/SKILL.md +561 -0
- package/dist/skills/pdf/SKILL.md +314 -0
- package/dist/skills/pdf/forms.md +294 -0
- package/dist/skills/pdf/reference.md +612 -0
- package/dist/skills/pdf/scripts/check_bounding_boxes.py +65 -0
- package/dist/skills/pdf/scripts/check_fillable_fields.py +11 -0
- package/dist/skills/pdf/scripts/convert_pdf_to_images.py +33 -0
- package/dist/skills/pdf/scripts/create_validation_image.py +37 -0
- package/dist/skills/pdf/scripts/extract_form_field_info.py +122 -0
- package/dist/skills/pdf/scripts/extract_form_structure.py +115 -0
- package/dist/skills/pdf/scripts/fill_fillable_fields.py +98 -0
- package/dist/skills/pdf/scripts/fill_pdf_form_with_annotations.py +107 -0
- package/dist/skills/pptx/SKILL.md +232 -0
- package/dist/skills/pptx/editing.md +205 -0
- package/dist/skills/pptx/pptxgenjs.md +420 -0
- package/dist/skills/pptx/scripts/__init__.py +0 -0
- package/dist/skills/pptx/scripts/add_slide.py +195 -0
- package/dist/skills/pptx/scripts/clean.py +286 -0
- package/dist/skills/pptx/scripts/office/helpers/__init__.py +0 -0
- package/dist/skills/pptx/scripts/office/helpers/merge_runs.py +199 -0
- package/dist/skills/pptx/scripts/office/helpers/simplify_redlines.py +197 -0
- package/dist/skills/pptx/scripts/office/pack.py +159 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +1499 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +146 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +1085 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +11 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +3081 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +23 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +185 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +287 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +1676 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +28 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +144 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +174 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +25 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +18 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +59 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +56 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +195 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +582 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +25 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +4439 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +570 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +509 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +12 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +108 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +96 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +3646 -0
- package/dist/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +116 -0
- package/dist/skills/pptx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +42 -0
- package/dist/skills/pptx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +50 -0
- package/dist/skills/pptx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +49 -0
- package/dist/skills/pptx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +33 -0
- package/dist/skills/pptx/scripts/office/schemas/mce/mc.xsd +75 -0
- package/dist/skills/pptx/scripts/office/schemas/microsoft/wml-2010.xsd +560 -0
- package/dist/skills/pptx/scripts/office/schemas/microsoft/wml-2012.xsd +67 -0
- package/dist/skills/pptx/scripts/office/schemas/microsoft/wml-2018.xsd +14 -0
- package/dist/skills/pptx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +20 -0
- package/dist/skills/pptx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +13 -0
- package/dist/skills/pptx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +4 -0
- package/dist/skills/pptx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +8 -0
- package/dist/skills/pptx/scripts/office/soffice.py +183 -0
- package/dist/skills/pptx/scripts/office/unpack.py +132 -0
- package/dist/skills/pptx/scripts/office/validate.py +111 -0
- package/dist/skills/pptx/scripts/office/validators/__init__.py +15 -0
- package/dist/skills/pptx/scripts/office/validators/base.py +847 -0
- package/dist/skills/pptx/scripts/office/validators/docx.py +446 -0
- package/dist/skills/pptx/scripts/office/validators/pptx.py +275 -0
- package/dist/skills/pptx/scripts/office/validators/redlining.py +247 -0
- package/dist/skills/pptx/scripts/thumbnail.py +289 -0
- package/dist/skills/skill-creator/SKILL.md +357 -0
- package/dist/skills/skill-creator/references/output-patterns.md +82 -0
- package/dist/skills/skill-creator/references/workflows.md +28 -0
- package/dist/skills/skill-creator/scripts/init_skill.py +303 -0
- package/dist/skills/skill-creator/scripts/package_skill.py +110 -0
- package/dist/skills/skill-creator/scripts/quick_validate.py +103 -0
- package/dist/skills/slack-gif-creator/SKILL.md +254 -0
- package/dist/skills/slack-gif-creator/core/easing.py +234 -0
- package/dist/skills/slack-gif-creator/core/frame_composer.py +176 -0
- package/dist/skills/slack-gif-creator/core/gif_builder.py +269 -0
- package/dist/skills/slack-gif-creator/core/validators.py +136 -0
- package/dist/skills/slack-gif-creator/requirements.txt +4 -0
- package/dist/skills/theme-factory/SKILL.md +59 -0
- package/dist/skills/theme-factory/theme-showcase.pdf +0 -0
- package/dist/skills/theme-factory/themes/arctic-frost.md +19 -0
- package/dist/skills/theme-factory/themes/botanical-garden.md +19 -0
- package/dist/skills/theme-factory/themes/desert-rose.md +19 -0
- package/dist/skills/theme-factory/themes/forest-canopy.md +19 -0
- package/dist/skills/theme-factory/themes/golden-hour.md +19 -0
- package/dist/skills/theme-factory/themes/midnight-galaxy.md +19 -0
- package/dist/skills/theme-factory/themes/modern-minimalist.md +19 -0
- package/dist/skills/theme-factory/themes/ocean-depths.md +19 -0
- package/dist/skills/theme-factory/themes/sunset-boulevard.md +19 -0
- package/dist/skills/theme-factory/themes/tech-innovation.md +19 -0
- package/dist/skills/web-artifacts-builder/SKILL.md +74 -0
- package/dist/skills/web-artifacts-builder/scripts/bundle-artifact.sh +54 -0
- package/dist/skills/web-artifacts-builder/scripts/init-artifact.sh +322 -0
- package/dist/skills/web-artifacts-builder/scripts/shadcn-components.tar.gz +0 -0
- package/dist/skills/webapp-testing/SKILL.md +96 -0
- package/dist/skills/webapp-testing/examples/console_logging.py +35 -0
- package/dist/skills/webapp-testing/examples/element_discovery.py +40 -0
- package/dist/skills/webapp-testing/examples/static_html_automation.py +33 -0
- package/dist/skills/webapp-testing/scripts/with_server.py +106 -0
- package/dist/skills/xlsx/SKILL.md +292 -0
- package/dist/skills/xlsx/scripts/office/helpers/__init__.py +0 -0
- package/dist/skills/xlsx/scripts/office/helpers/merge_runs.py +199 -0
- package/dist/skills/xlsx/scripts/office/helpers/simplify_redlines.py +197 -0
- package/dist/skills/xlsx/scripts/office/pack.py +159 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +1499 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +146 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +1085 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +11 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +3081 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +23 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +185 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +287 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +1676 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +28 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +144 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +174 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +25 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +18 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +59 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +56 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +195 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +582 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +25 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +4439 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +570 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +509 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +12 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +108 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +96 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +3646 -0
- package/dist/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +116 -0
- package/dist/skills/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +42 -0
- package/dist/skills/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +50 -0
- package/dist/skills/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +49 -0
- package/dist/skills/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +33 -0
- package/dist/skills/xlsx/scripts/office/schemas/mce/mc.xsd +75 -0
- package/dist/skills/xlsx/scripts/office/schemas/microsoft/wml-2010.xsd +560 -0
- package/dist/skills/xlsx/scripts/office/schemas/microsoft/wml-2012.xsd +67 -0
- package/dist/skills/xlsx/scripts/office/schemas/microsoft/wml-2018.xsd +14 -0
- package/dist/skills/xlsx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +20 -0
- package/dist/skills/xlsx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +13 -0
- package/dist/skills/xlsx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +4 -0
- package/dist/skills/xlsx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +8 -0
- package/dist/skills/xlsx/scripts/office/soffice.py +183 -0
- package/dist/skills/xlsx/scripts/office/unpack.py +132 -0
- package/dist/skills/xlsx/scripts/office/validate.py +111 -0
- package/dist/skills/xlsx/scripts/office/validators/__init__.py +15 -0
- package/dist/skills/xlsx/scripts/office/validators/base.py +847 -0
- package/dist/skills/xlsx/scripts/office/validators/docx.py +446 -0
- package/dist/skills/xlsx/scripts/office/validators/pptx.py +275 -0
- package/dist/skills/xlsx/scripts/office/validators/redlining.py +247 -0
- package/dist/skills/xlsx/scripts/recalc.py +184 -0
- package/package.json +11 -4
|
@@ -0,0 +1,286 @@
|
|
|
1
|
+
"""Remove unreferenced files from an unpacked PPTX directory.
|
|
2
|
+
|
|
3
|
+
Usage: python clean.py <unpacked_dir>
|
|
4
|
+
|
|
5
|
+
Example:
|
|
6
|
+
python clean.py unpacked/
|
|
7
|
+
|
|
8
|
+
This script removes:
|
|
9
|
+
- Orphaned slides (not in sldIdLst) and their relationships
|
|
10
|
+
- [trash] directory (unreferenced files)
|
|
11
|
+
- Orphaned .rels files for deleted resources
|
|
12
|
+
- Unreferenced media, embeddings, charts, diagrams, drawings, ink files
|
|
13
|
+
- Unreferenced theme files
|
|
14
|
+
- Unreferenced notes slides
|
|
15
|
+
- Content-Type overrides for deleted files
|
|
16
|
+
"""
|
|
17
|
+
|
|
18
|
+
import sys
|
|
19
|
+
from pathlib import Path
|
|
20
|
+
|
|
21
|
+
import defusedxml.minidom
|
|
22
|
+
|
|
23
|
+
|
|
24
|
+
import re
|
|
25
|
+
|
|
26
|
+
|
|
27
|
+
def get_slides_in_sldidlst(unpacked_dir: Path) -> set[str]:
|
|
28
|
+
pres_path = unpacked_dir / "ppt" / "presentation.xml"
|
|
29
|
+
pres_rels_path = unpacked_dir / "ppt" / "_rels" / "presentation.xml.rels"
|
|
30
|
+
|
|
31
|
+
if not pres_path.exists() or not pres_rels_path.exists():
|
|
32
|
+
return set()
|
|
33
|
+
|
|
34
|
+
rels_dom = defusedxml.minidom.parse(str(pres_rels_path))
|
|
35
|
+
rid_to_slide = {}
|
|
36
|
+
for rel in rels_dom.getElementsByTagName("Relationship"):
|
|
37
|
+
rid = rel.getAttribute("Id")
|
|
38
|
+
target = rel.getAttribute("Target")
|
|
39
|
+
rel_type = rel.getAttribute("Type")
|
|
40
|
+
if "slide" in rel_type and target.startswith("slides/"):
|
|
41
|
+
rid_to_slide[rid] = target.replace("slides/", "")
|
|
42
|
+
|
|
43
|
+
pres_content = pres_path.read_text(encoding="utf-8")
|
|
44
|
+
referenced_rids = set(re.findall(r'<p:sldId[^>]*r:id="([^"]+)"', pres_content))
|
|
45
|
+
|
|
46
|
+
return {rid_to_slide[rid] for rid in referenced_rids if rid in rid_to_slide}
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
def remove_orphaned_slides(unpacked_dir: Path) -> list[str]:
|
|
50
|
+
slides_dir = unpacked_dir / "ppt" / "slides"
|
|
51
|
+
slides_rels_dir = slides_dir / "_rels"
|
|
52
|
+
pres_rels_path = unpacked_dir / "ppt" / "_rels" / "presentation.xml.rels"
|
|
53
|
+
|
|
54
|
+
if not slides_dir.exists():
|
|
55
|
+
return []
|
|
56
|
+
|
|
57
|
+
referenced_slides = get_slides_in_sldidlst(unpacked_dir)
|
|
58
|
+
removed = []
|
|
59
|
+
|
|
60
|
+
for slide_file in slides_dir.glob("slide*.xml"):
|
|
61
|
+
if slide_file.name not in referenced_slides:
|
|
62
|
+
rel_path = slide_file.relative_to(unpacked_dir)
|
|
63
|
+
slide_file.unlink()
|
|
64
|
+
removed.append(str(rel_path))
|
|
65
|
+
|
|
66
|
+
rels_file = slides_rels_dir / f"{slide_file.name}.rels"
|
|
67
|
+
if rels_file.exists():
|
|
68
|
+
rels_file.unlink()
|
|
69
|
+
removed.append(str(rels_file.relative_to(unpacked_dir)))
|
|
70
|
+
|
|
71
|
+
if removed and pres_rels_path.exists():
|
|
72
|
+
rels_dom = defusedxml.minidom.parse(str(pres_rels_path))
|
|
73
|
+
changed = False
|
|
74
|
+
|
|
75
|
+
for rel in list(rels_dom.getElementsByTagName("Relationship")):
|
|
76
|
+
target = rel.getAttribute("Target")
|
|
77
|
+
if target.startswith("slides/"):
|
|
78
|
+
slide_name = target.replace("slides/", "")
|
|
79
|
+
if slide_name not in referenced_slides:
|
|
80
|
+
if rel.parentNode:
|
|
81
|
+
rel.parentNode.removeChild(rel)
|
|
82
|
+
changed = True
|
|
83
|
+
|
|
84
|
+
if changed:
|
|
85
|
+
with open(pres_rels_path, "wb") as f:
|
|
86
|
+
f.write(rels_dom.toxml(encoding="utf-8"))
|
|
87
|
+
|
|
88
|
+
return removed
|
|
89
|
+
|
|
90
|
+
|
|
91
|
+
def remove_trash_directory(unpacked_dir: Path) -> list[str]:
|
|
92
|
+
trash_dir = unpacked_dir / "[trash]"
|
|
93
|
+
removed = []
|
|
94
|
+
|
|
95
|
+
if trash_dir.exists() and trash_dir.is_dir():
|
|
96
|
+
for file_path in trash_dir.iterdir():
|
|
97
|
+
if file_path.is_file():
|
|
98
|
+
rel_path = file_path.relative_to(unpacked_dir)
|
|
99
|
+
removed.append(str(rel_path))
|
|
100
|
+
file_path.unlink()
|
|
101
|
+
trash_dir.rmdir()
|
|
102
|
+
|
|
103
|
+
return removed
|
|
104
|
+
|
|
105
|
+
|
|
106
|
+
def get_slide_referenced_files(unpacked_dir: Path) -> set:
|
|
107
|
+
referenced = set()
|
|
108
|
+
slides_rels_dir = unpacked_dir / "ppt" / "slides" / "_rels"
|
|
109
|
+
|
|
110
|
+
if not slides_rels_dir.exists():
|
|
111
|
+
return referenced
|
|
112
|
+
|
|
113
|
+
for rels_file in slides_rels_dir.glob("*.rels"):
|
|
114
|
+
dom = defusedxml.minidom.parse(str(rels_file))
|
|
115
|
+
for rel in dom.getElementsByTagName("Relationship"):
|
|
116
|
+
target = rel.getAttribute("Target")
|
|
117
|
+
if not target:
|
|
118
|
+
continue
|
|
119
|
+
target_path = (rels_file.parent.parent / target).resolve()
|
|
120
|
+
try:
|
|
121
|
+
referenced.add(target_path.relative_to(unpacked_dir.resolve()))
|
|
122
|
+
except ValueError:
|
|
123
|
+
pass
|
|
124
|
+
|
|
125
|
+
return referenced
|
|
126
|
+
|
|
127
|
+
|
|
128
|
+
def remove_orphaned_rels_files(unpacked_dir: Path) -> list[str]:
|
|
129
|
+
resource_dirs = ["charts", "diagrams", "drawings"]
|
|
130
|
+
removed = []
|
|
131
|
+
slide_referenced = get_slide_referenced_files(unpacked_dir)
|
|
132
|
+
|
|
133
|
+
for dir_name in resource_dirs:
|
|
134
|
+
rels_dir = unpacked_dir / "ppt" / dir_name / "_rels"
|
|
135
|
+
if not rels_dir.exists():
|
|
136
|
+
continue
|
|
137
|
+
|
|
138
|
+
for rels_file in rels_dir.glob("*.rels"):
|
|
139
|
+
resource_file = rels_dir.parent / rels_file.name.replace(".rels", "")
|
|
140
|
+
try:
|
|
141
|
+
resource_rel_path = resource_file.resolve().relative_to(unpacked_dir.resolve())
|
|
142
|
+
except ValueError:
|
|
143
|
+
continue
|
|
144
|
+
|
|
145
|
+
if not resource_file.exists() or resource_rel_path not in slide_referenced:
|
|
146
|
+
rels_file.unlink()
|
|
147
|
+
rel_path = rels_file.relative_to(unpacked_dir)
|
|
148
|
+
removed.append(str(rel_path))
|
|
149
|
+
|
|
150
|
+
return removed
|
|
151
|
+
|
|
152
|
+
|
|
153
|
+
def get_referenced_files(unpacked_dir: Path) -> set:
|
|
154
|
+
referenced = set()
|
|
155
|
+
|
|
156
|
+
for rels_file in unpacked_dir.rglob("*.rels"):
|
|
157
|
+
dom = defusedxml.minidom.parse(str(rels_file))
|
|
158
|
+
for rel in dom.getElementsByTagName("Relationship"):
|
|
159
|
+
target = rel.getAttribute("Target")
|
|
160
|
+
if not target:
|
|
161
|
+
continue
|
|
162
|
+
target_path = (rels_file.parent.parent / target).resolve()
|
|
163
|
+
try:
|
|
164
|
+
referenced.add(target_path.relative_to(unpacked_dir.resolve()))
|
|
165
|
+
except ValueError:
|
|
166
|
+
pass
|
|
167
|
+
|
|
168
|
+
return referenced
|
|
169
|
+
|
|
170
|
+
|
|
171
|
+
def remove_orphaned_files(unpacked_dir: Path, referenced: set) -> list[str]:
|
|
172
|
+
resource_dirs = ["media", "embeddings", "charts", "diagrams", "tags", "drawings", "ink"]
|
|
173
|
+
removed = []
|
|
174
|
+
|
|
175
|
+
for dir_name in resource_dirs:
|
|
176
|
+
dir_path = unpacked_dir / "ppt" / dir_name
|
|
177
|
+
if not dir_path.exists():
|
|
178
|
+
continue
|
|
179
|
+
|
|
180
|
+
for file_path in dir_path.glob("*"):
|
|
181
|
+
if not file_path.is_file():
|
|
182
|
+
continue
|
|
183
|
+
rel_path = file_path.relative_to(unpacked_dir)
|
|
184
|
+
if rel_path not in referenced:
|
|
185
|
+
file_path.unlink()
|
|
186
|
+
removed.append(str(rel_path))
|
|
187
|
+
|
|
188
|
+
theme_dir = unpacked_dir / "ppt" / "theme"
|
|
189
|
+
if theme_dir.exists():
|
|
190
|
+
for file_path in theme_dir.glob("theme*.xml"):
|
|
191
|
+
rel_path = file_path.relative_to(unpacked_dir)
|
|
192
|
+
if rel_path not in referenced:
|
|
193
|
+
file_path.unlink()
|
|
194
|
+
removed.append(str(rel_path))
|
|
195
|
+
theme_rels = theme_dir / "_rels" / f"{file_path.name}.rels"
|
|
196
|
+
if theme_rels.exists():
|
|
197
|
+
theme_rels.unlink()
|
|
198
|
+
removed.append(str(theme_rels.relative_to(unpacked_dir)))
|
|
199
|
+
|
|
200
|
+
notes_dir = unpacked_dir / "ppt" / "notesSlides"
|
|
201
|
+
if notes_dir.exists():
|
|
202
|
+
for file_path in notes_dir.glob("*.xml"):
|
|
203
|
+
if not file_path.is_file():
|
|
204
|
+
continue
|
|
205
|
+
rel_path = file_path.relative_to(unpacked_dir)
|
|
206
|
+
if rel_path not in referenced:
|
|
207
|
+
file_path.unlink()
|
|
208
|
+
removed.append(str(rel_path))
|
|
209
|
+
|
|
210
|
+
notes_rels_dir = notes_dir / "_rels"
|
|
211
|
+
if notes_rels_dir.exists():
|
|
212
|
+
for file_path in notes_rels_dir.glob("*.rels"):
|
|
213
|
+
notes_file = notes_dir / file_path.name.replace(".rels", "")
|
|
214
|
+
if not notes_file.exists():
|
|
215
|
+
file_path.unlink()
|
|
216
|
+
removed.append(str(file_path.relative_to(unpacked_dir)))
|
|
217
|
+
|
|
218
|
+
return removed
|
|
219
|
+
|
|
220
|
+
|
|
221
|
+
def update_content_types(unpacked_dir: Path, removed_files: list[str]) -> None:
|
|
222
|
+
ct_path = unpacked_dir / "[Content_Types].xml"
|
|
223
|
+
if not ct_path.exists():
|
|
224
|
+
return
|
|
225
|
+
|
|
226
|
+
dom = defusedxml.minidom.parse(str(ct_path))
|
|
227
|
+
changed = False
|
|
228
|
+
|
|
229
|
+
for override in list(dom.getElementsByTagName("Override")):
|
|
230
|
+
part_name = override.getAttribute("PartName").lstrip("/")
|
|
231
|
+
if part_name in removed_files:
|
|
232
|
+
if override.parentNode:
|
|
233
|
+
override.parentNode.removeChild(override)
|
|
234
|
+
changed = True
|
|
235
|
+
|
|
236
|
+
if changed:
|
|
237
|
+
with open(ct_path, "wb") as f:
|
|
238
|
+
f.write(dom.toxml(encoding="utf-8"))
|
|
239
|
+
|
|
240
|
+
|
|
241
|
+
def clean_unused_files(unpacked_dir: Path) -> list[str]:
|
|
242
|
+
all_removed = []
|
|
243
|
+
|
|
244
|
+
slides_removed = remove_orphaned_slides(unpacked_dir)
|
|
245
|
+
all_removed.extend(slides_removed)
|
|
246
|
+
|
|
247
|
+
trash_removed = remove_trash_directory(unpacked_dir)
|
|
248
|
+
all_removed.extend(trash_removed)
|
|
249
|
+
|
|
250
|
+
while True:
|
|
251
|
+
removed_rels = remove_orphaned_rels_files(unpacked_dir)
|
|
252
|
+
referenced = get_referenced_files(unpacked_dir)
|
|
253
|
+
removed_files = remove_orphaned_files(unpacked_dir, referenced)
|
|
254
|
+
|
|
255
|
+
total_removed = removed_rels + removed_files
|
|
256
|
+
if not total_removed:
|
|
257
|
+
break
|
|
258
|
+
|
|
259
|
+
all_removed.extend(total_removed)
|
|
260
|
+
|
|
261
|
+
if all_removed:
|
|
262
|
+
update_content_types(unpacked_dir, all_removed)
|
|
263
|
+
|
|
264
|
+
return all_removed
|
|
265
|
+
|
|
266
|
+
|
|
267
|
+
if __name__ == "__main__":
|
|
268
|
+
if len(sys.argv) != 2:
|
|
269
|
+
print("Usage: python clean.py <unpacked_dir>", file=sys.stderr)
|
|
270
|
+
print("Example: python clean.py unpacked/", file=sys.stderr)
|
|
271
|
+
sys.exit(1)
|
|
272
|
+
|
|
273
|
+
unpacked_dir = Path(sys.argv[1])
|
|
274
|
+
|
|
275
|
+
if not unpacked_dir.exists():
|
|
276
|
+
print(f"Error: {unpacked_dir} not found", file=sys.stderr)
|
|
277
|
+
sys.exit(1)
|
|
278
|
+
|
|
279
|
+
removed = clean_unused_files(unpacked_dir)
|
|
280
|
+
|
|
281
|
+
if removed:
|
|
282
|
+
print(f"Removed {len(removed)} unreferenced files:")
|
|
283
|
+
for f in removed:
|
|
284
|
+
print(f" {f}")
|
|
285
|
+
else:
|
|
286
|
+
print("No unreferenced files found")
|
|
File without changes
|
|
@@ -0,0 +1,199 @@
|
|
|
1
|
+
"""Merge adjacent runs with identical formatting in DOCX.
|
|
2
|
+
|
|
3
|
+
Merges adjacent <w:r> elements that have identical <w:rPr> properties.
|
|
4
|
+
Works on runs in paragraphs and inside tracked changes (<w:ins>, <w:del>).
|
|
5
|
+
|
|
6
|
+
Also:
|
|
7
|
+
- Removes rsid attributes from runs (revision metadata that doesn't affect rendering)
|
|
8
|
+
- Removes proofErr elements (spell/grammar markers that block merging)
|
|
9
|
+
"""
|
|
10
|
+
|
|
11
|
+
from pathlib import Path
|
|
12
|
+
|
|
13
|
+
import defusedxml.minidom
|
|
14
|
+
|
|
15
|
+
|
|
16
|
+
def merge_runs(input_dir: str) -> tuple[int, str]:
|
|
17
|
+
doc_xml = Path(input_dir) / "word" / "document.xml"
|
|
18
|
+
|
|
19
|
+
if not doc_xml.exists():
|
|
20
|
+
return 0, f"Error: {doc_xml} not found"
|
|
21
|
+
|
|
22
|
+
try:
|
|
23
|
+
dom = defusedxml.minidom.parseString(doc_xml.read_text(encoding="utf-8"))
|
|
24
|
+
root = dom.documentElement
|
|
25
|
+
|
|
26
|
+
_remove_elements(root, "proofErr")
|
|
27
|
+
_strip_run_rsid_attrs(root)
|
|
28
|
+
|
|
29
|
+
containers = {run.parentNode for run in _find_elements(root, "r")}
|
|
30
|
+
|
|
31
|
+
merge_count = 0
|
|
32
|
+
for container in containers:
|
|
33
|
+
merge_count += _merge_runs_in(container)
|
|
34
|
+
|
|
35
|
+
doc_xml.write_bytes(dom.toxml(encoding="UTF-8"))
|
|
36
|
+
return merge_count, f"Merged {merge_count} runs"
|
|
37
|
+
|
|
38
|
+
except Exception as e:
|
|
39
|
+
return 0, f"Error: {e}"
|
|
40
|
+
|
|
41
|
+
|
|
42
|
+
|
|
43
|
+
|
|
44
|
+
def _find_elements(root, tag: str) -> list:
|
|
45
|
+
results = []
|
|
46
|
+
|
|
47
|
+
def traverse(node):
|
|
48
|
+
if node.nodeType == node.ELEMENT_NODE:
|
|
49
|
+
name = node.localName or node.tagName
|
|
50
|
+
if name == tag or name.endswith(f":{tag}"):
|
|
51
|
+
results.append(node)
|
|
52
|
+
for child in node.childNodes:
|
|
53
|
+
traverse(child)
|
|
54
|
+
|
|
55
|
+
traverse(root)
|
|
56
|
+
return results
|
|
57
|
+
|
|
58
|
+
|
|
59
|
+
def _get_child(parent, tag: str):
|
|
60
|
+
for child in parent.childNodes:
|
|
61
|
+
if child.nodeType == child.ELEMENT_NODE:
|
|
62
|
+
name = child.localName or child.tagName
|
|
63
|
+
if name == tag or name.endswith(f":{tag}"):
|
|
64
|
+
return child
|
|
65
|
+
return None
|
|
66
|
+
|
|
67
|
+
|
|
68
|
+
def _get_children(parent, tag: str) -> list:
|
|
69
|
+
results = []
|
|
70
|
+
for child in parent.childNodes:
|
|
71
|
+
if child.nodeType == child.ELEMENT_NODE:
|
|
72
|
+
name = child.localName or child.tagName
|
|
73
|
+
if name == tag or name.endswith(f":{tag}"):
|
|
74
|
+
results.append(child)
|
|
75
|
+
return results
|
|
76
|
+
|
|
77
|
+
|
|
78
|
+
def _is_adjacent(elem1, elem2) -> bool:
|
|
79
|
+
node = elem1.nextSibling
|
|
80
|
+
while node:
|
|
81
|
+
if node == elem2:
|
|
82
|
+
return True
|
|
83
|
+
if node.nodeType == node.ELEMENT_NODE:
|
|
84
|
+
return False
|
|
85
|
+
if node.nodeType == node.TEXT_NODE and node.data.strip():
|
|
86
|
+
return False
|
|
87
|
+
node = node.nextSibling
|
|
88
|
+
return False
|
|
89
|
+
|
|
90
|
+
|
|
91
|
+
|
|
92
|
+
|
|
93
|
+
def _remove_elements(root, tag: str):
|
|
94
|
+
for elem in _find_elements(root, tag):
|
|
95
|
+
if elem.parentNode:
|
|
96
|
+
elem.parentNode.removeChild(elem)
|
|
97
|
+
|
|
98
|
+
|
|
99
|
+
def _strip_run_rsid_attrs(root):
|
|
100
|
+
for run in _find_elements(root, "r"):
|
|
101
|
+
for attr in list(run.attributes.values()):
|
|
102
|
+
if "rsid" in attr.name.lower():
|
|
103
|
+
run.removeAttribute(attr.name)
|
|
104
|
+
|
|
105
|
+
|
|
106
|
+
|
|
107
|
+
|
|
108
|
+
def _merge_runs_in(container) -> int:
|
|
109
|
+
merge_count = 0
|
|
110
|
+
run = _first_child_run(container)
|
|
111
|
+
|
|
112
|
+
while run:
|
|
113
|
+
while True:
|
|
114
|
+
next_elem = _next_element_sibling(run)
|
|
115
|
+
if next_elem and _is_run(next_elem) and _can_merge(run, next_elem):
|
|
116
|
+
_merge_run_content(run, next_elem)
|
|
117
|
+
container.removeChild(next_elem)
|
|
118
|
+
merge_count += 1
|
|
119
|
+
else:
|
|
120
|
+
break
|
|
121
|
+
|
|
122
|
+
_consolidate_text(run)
|
|
123
|
+
run = _next_sibling_run(run)
|
|
124
|
+
|
|
125
|
+
return merge_count
|
|
126
|
+
|
|
127
|
+
|
|
128
|
+
def _first_child_run(container):
|
|
129
|
+
for child in container.childNodes:
|
|
130
|
+
if child.nodeType == child.ELEMENT_NODE and _is_run(child):
|
|
131
|
+
return child
|
|
132
|
+
return None
|
|
133
|
+
|
|
134
|
+
|
|
135
|
+
def _next_element_sibling(node):
|
|
136
|
+
sibling = node.nextSibling
|
|
137
|
+
while sibling:
|
|
138
|
+
if sibling.nodeType == sibling.ELEMENT_NODE:
|
|
139
|
+
return sibling
|
|
140
|
+
sibling = sibling.nextSibling
|
|
141
|
+
return None
|
|
142
|
+
|
|
143
|
+
|
|
144
|
+
def _next_sibling_run(node):
|
|
145
|
+
sibling = node.nextSibling
|
|
146
|
+
while sibling:
|
|
147
|
+
if sibling.nodeType == sibling.ELEMENT_NODE:
|
|
148
|
+
if _is_run(sibling):
|
|
149
|
+
return sibling
|
|
150
|
+
sibling = sibling.nextSibling
|
|
151
|
+
return None
|
|
152
|
+
|
|
153
|
+
|
|
154
|
+
def _is_run(node) -> bool:
|
|
155
|
+
name = node.localName or node.tagName
|
|
156
|
+
return name == "r" or name.endswith(":r")
|
|
157
|
+
|
|
158
|
+
|
|
159
|
+
def _can_merge(run1, run2) -> bool:
|
|
160
|
+
rpr1 = _get_child(run1, "rPr")
|
|
161
|
+
rpr2 = _get_child(run2, "rPr")
|
|
162
|
+
|
|
163
|
+
if (rpr1 is None) != (rpr2 is None):
|
|
164
|
+
return False
|
|
165
|
+
if rpr1 is None:
|
|
166
|
+
return True
|
|
167
|
+
return rpr1.toxml() == rpr2.toxml()
|
|
168
|
+
|
|
169
|
+
|
|
170
|
+
def _merge_run_content(target, source):
|
|
171
|
+
for child in list(source.childNodes):
|
|
172
|
+
if child.nodeType == child.ELEMENT_NODE:
|
|
173
|
+
name = child.localName or child.tagName
|
|
174
|
+
if name != "rPr" and not name.endswith(":rPr"):
|
|
175
|
+
target.appendChild(child)
|
|
176
|
+
|
|
177
|
+
|
|
178
|
+
def _consolidate_text(run):
|
|
179
|
+
t_elements = _get_children(run, "t")
|
|
180
|
+
|
|
181
|
+
for i in range(len(t_elements) - 1, 0, -1):
|
|
182
|
+
curr, prev = t_elements[i], t_elements[i - 1]
|
|
183
|
+
|
|
184
|
+
if _is_adjacent(prev, curr):
|
|
185
|
+
prev_text = prev.firstChild.data if prev.firstChild else ""
|
|
186
|
+
curr_text = curr.firstChild.data if curr.firstChild else ""
|
|
187
|
+
merged = prev_text + curr_text
|
|
188
|
+
|
|
189
|
+
if prev.firstChild:
|
|
190
|
+
prev.firstChild.data = merged
|
|
191
|
+
else:
|
|
192
|
+
prev.appendChild(run.ownerDocument.createTextNode(merged))
|
|
193
|
+
|
|
194
|
+
if merged.startswith(" ") or merged.endswith(" "):
|
|
195
|
+
prev.setAttribute("xml:space", "preserve")
|
|
196
|
+
elif prev.hasAttribute("xml:space"):
|
|
197
|
+
prev.removeAttribute("xml:space")
|
|
198
|
+
|
|
199
|
+
run.removeChild(curr)
|
|
@@ -0,0 +1,197 @@
|
|
|
1
|
+
"""Simplify tracked changes by merging adjacent w:ins or w:del elements.
|
|
2
|
+
|
|
3
|
+
Merges adjacent <w:ins> elements from the same author into a single element.
|
|
4
|
+
Same for <w:del> elements. This makes heavily-redlined documents easier to
|
|
5
|
+
work with by reducing the number of tracked change wrappers.
|
|
6
|
+
|
|
7
|
+
Rules:
|
|
8
|
+
- Only merges w:ins with w:ins, w:del with w:del (same element type)
|
|
9
|
+
- Only merges if same author (ignores timestamp differences)
|
|
10
|
+
- Only merges if truly adjacent (only whitespace between them)
|
|
11
|
+
"""
|
|
12
|
+
|
|
13
|
+
import xml.etree.ElementTree as ET
|
|
14
|
+
import zipfile
|
|
15
|
+
from pathlib import Path
|
|
16
|
+
|
|
17
|
+
import defusedxml.minidom
|
|
18
|
+
|
|
19
|
+
WORD_NS = "http://schemas.openxmlformats.org/wordprocessingml/2006/main"
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
def simplify_redlines(input_dir: str) -> tuple[int, str]:
|
|
23
|
+
doc_xml = Path(input_dir) / "word" / "document.xml"
|
|
24
|
+
|
|
25
|
+
if not doc_xml.exists():
|
|
26
|
+
return 0, f"Error: {doc_xml} not found"
|
|
27
|
+
|
|
28
|
+
try:
|
|
29
|
+
dom = defusedxml.minidom.parseString(doc_xml.read_text(encoding="utf-8"))
|
|
30
|
+
root = dom.documentElement
|
|
31
|
+
|
|
32
|
+
merge_count = 0
|
|
33
|
+
|
|
34
|
+
containers = _find_elements(root, "p") + _find_elements(root, "tc")
|
|
35
|
+
|
|
36
|
+
for container in containers:
|
|
37
|
+
merge_count += _merge_tracked_changes_in(container, "ins")
|
|
38
|
+
merge_count += _merge_tracked_changes_in(container, "del")
|
|
39
|
+
|
|
40
|
+
doc_xml.write_bytes(dom.toxml(encoding="UTF-8"))
|
|
41
|
+
return merge_count, f"Simplified {merge_count} tracked changes"
|
|
42
|
+
|
|
43
|
+
except Exception as e:
|
|
44
|
+
return 0, f"Error: {e}"
|
|
45
|
+
|
|
46
|
+
|
|
47
|
+
def _merge_tracked_changes_in(container, tag: str) -> int:
|
|
48
|
+
merge_count = 0
|
|
49
|
+
|
|
50
|
+
tracked = [
|
|
51
|
+
child
|
|
52
|
+
for child in container.childNodes
|
|
53
|
+
if child.nodeType == child.ELEMENT_NODE and _is_element(child, tag)
|
|
54
|
+
]
|
|
55
|
+
|
|
56
|
+
if len(tracked) < 2:
|
|
57
|
+
return 0
|
|
58
|
+
|
|
59
|
+
i = 0
|
|
60
|
+
while i < len(tracked) - 1:
|
|
61
|
+
curr = tracked[i]
|
|
62
|
+
next_elem = tracked[i + 1]
|
|
63
|
+
|
|
64
|
+
if _can_merge_tracked(curr, next_elem):
|
|
65
|
+
_merge_tracked_content(curr, next_elem)
|
|
66
|
+
container.removeChild(next_elem)
|
|
67
|
+
tracked.pop(i + 1)
|
|
68
|
+
merge_count += 1
|
|
69
|
+
else:
|
|
70
|
+
i += 1
|
|
71
|
+
|
|
72
|
+
return merge_count
|
|
73
|
+
|
|
74
|
+
|
|
75
|
+
def _is_element(node, tag: str) -> bool:
|
|
76
|
+
name = node.localName or node.tagName
|
|
77
|
+
return name == tag or name.endswith(f":{tag}")
|
|
78
|
+
|
|
79
|
+
|
|
80
|
+
def _get_author(elem) -> str:
|
|
81
|
+
author = elem.getAttribute("w:author")
|
|
82
|
+
if not author:
|
|
83
|
+
for attr in elem.attributes.values():
|
|
84
|
+
if attr.localName == "author" or attr.name.endswith(":author"):
|
|
85
|
+
return attr.value
|
|
86
|
+
return author
|
|
87
|
+
|
|
88
|
+
|
|
89
|
+
def _can_merge_tracked(elem1, elem2) -> bool:
|
|
90
|
+
if _get_author(elem1) != _get_author(elem2):
|
|
91
|
+
return False
|
|
92
|
+
|
|
93
|
+
node = elem1.nextSibling
|
|
94
|
+
while node and node != elem2:
|
|
95
|
+
if node.nodeType == node.ELEMENT_NODE:
|
|
96
|
+
return False
|
|
97
|
+
if node.nodeType == node.TEXT_NODE and node.data.strip():
|
|
98
|
+
return False
|
|
99
|
+
node = node.nextSibling
|
|
100
|
+
|
|
101
|
+
return True
|
|
102
|
+
|
|
103
|
+
|
|
104
|
+
def _merge_tracked_content(target, source):
|
|
105
|
+
while source.firstChild:
|
|
106
|
+
child = source.firstChild
|
|
107
|
+
source.removeChild(child)
|
|
108
|
+
target.appendChild(child)
|
|
109
|
+
|
|
110
|
+
|
|
111
|
+
def _find_elements(root, tag: str) -> list:
|
|
112
|
+
results = []
|
|
113
|
+
|
|
114
|
+
def traverse(node):
|
|
115
|
+
if node.nodeType == node.ELEMENT_NODE:
|
|
116
|
+
name = node.localName or node.tagName
|
|
117
|
+
if name == tag or name.endswith(f":{tag}"):
|
|
118
|
+
results.append(node)
|
|
119
|
+
for child in node.childNodes:
|
|
120
|
+
traverse(child)
|
|
121
|
+
|
|
122
|
+
traverse(root)
|
|
123
|
+
return results
|
|
124
|
+
|
|
125
|
+
|
|
126
|
+
def get_tracked_change_authors(doc_xml_path: Path) -> dict[str, int]:
|
|
127
|
+
if not doc_xml_path.exists():
|
|
128
|
+
return {}
|
|
129
|
+
|
|
130
|
+
try:
|
|
131
|
+
tree = ET.parse(doc_xml_path)
|
|
132
|
+
root = tree.getroot()
|
|
133
|
+
except ET.ParseError:
|
|
134
|
+
return {}
|
|
135
|
+
|
|
136
|
+
namespaces = {"w": WORD_NS}
|
|
137
|
+
author_attr = f"{{{WORD_NS}}}author"
|
|
138
|
+
|
|
139
|
+
authors: dict[str, int] = {}
|
|
140
|
+
for tag in ["ins", "del"]:
|
|
141
|
+
for elem in root.findall(f".//w:{tag}", namespaces):
|
|
142
|
+
author = elem.get(author_attr)
|
|
143
|
+
if author:
|
|
144
|
+
authors[author] = authors.get(author, 0) + 1
|
|
145
|
+
|
|
146
|
+
return authors
|
|
147
|
+
|
|
148
|
+
|
|
149
|
+
def _get_authors_from_docx(docx_path: Path) -> dict[str, int]:
|
|
150
|
+
try:
|
|
151
|
+
with zipfile.ZipFile(docx_path, "r") as zf:
|
|
152
|
+
if "word/document.xml" not in zf.namelist():
|
|
153
|
+
return {}
|
|
154
|
+
with zf.open("word/document.xml") as f:
|
|
155
|
+
tree = ET.parse(f)
|
|
156
|
+
root = tree.getroot()
|
|
157
|
+
|
|
158
|
+
namespaces = {"w": WORD_NS}
|
|
159
|
+
author_attr = f"{{{WORD_NS}}}author"
|
|
160
|
+
|
|
161
|
+
authors: dict[str, int] = {}
|
|
162
|
+
for tag in ["ins", "del"]:
|
|
163
|
+
for elem in root.findall(f".//w:{tag}", namespaces):
|
|
164
|
+
author = elem.get(author_attr)
|
|
165
|
+
if author:
|
|
166
|
+
authors[author] = authors.get(author, 0) + 1
|
|
167
|
+
return authors
|
|
168
|
+
except (zipfile.BadZipFile, ET.ParseError):
|
|
169
|
+
return {}
|
|
170
|
+
|
|
171
|
+
|
|
172
|
+
def infer_author(modified_dir: Path, original_docx: Path, default: str = "Claude") -> str:
|
|
173
|
+
modified_xml = modified_dir / "word" / "document.xml"
|
|
174
|
+
modified_authors = get_tracked_change_authors(modified_xml)
|
|
175
|
+
|
|
176
|
+
if not modified_authors:
|
|
177
|
+
return default
|
|
178
|
+
|
|
179
|
+
original_authors = _get_authors_from_docx(original_docx)
|
|
180
|
+
|
|
181
|
+
new_changes: dict[str, int] = {}
|
|
182
|
+
for author, count in modified_authors.items():
|
|
183
|
+
original_count = original_authors.get(author, 0)
|
|
184
|
+
diff = count - original_count
|
|
185
|
+
if diff > 0:
|
|
186
|
+
new_changes[author] = diff
|
|
187
|
+
|
|
188
|
+
if not new_changes:
|
|
189
|
+
return default
|
|
190
|
+
|
|
191
|
+
if len(new_changes) == 1:
|
|
192
|
+
return next(iter(new_changes))
|
|
193
|
+
|
|
194
|
+
raise ValueError(
|
|
195
|
+
f"Multiple authors added new changes: {new_changes}. "
|
|
196
|
+
"Cannot infer which author to validate."
|
|
197
|
+
)
|