uniword 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/CHANGELOG.md +428 -0
- data/CONTRIBUTING.md +479 -0
- data/LICENSE.txt +25 -0
- data/README.adoc +2186 -0
- data/exe/uniword +6 -0
- data/lib/uniword/accessibility/accessibility_checker.rb +115 -0
- data/lib/uniword/accessibility/accessibility_profile.rb +133 -0
- data/lib/uniword/accessibility/accessibility_report.rb +212 -0
- data/lib/uniword/accessibility/accessibility_rule.rb +93 -0
- data/lib/uniword/accessibility/accessibility_violation.rb +80 -0
- data/lib/uniword/accessibility/rules/color_usage_rule.rb +30 -0
- data/lib/uniword/accessibility/rules/contrast_ratio_rule.rb +31 -0
- data/lib/uniword/accessibility/rules/descriptive_headings_rule.rb +99 -0
- data/lib/uniword/accessibility/rules/document_title_rule.rb +64 -0
- data/lib/uniword/accessibility/rules/heading_structure_rule.rb +127 -0
- data/lib/uniword/accessibility/rules/image_alt_text_rule.rb +89 -0
- data/lib/uniword/accessibility/rules/language_specification_rule.rb +55 -0
- data/lib/uniword/accessibility/rules/list_structure_rule.rb +33 -0
- data/lib/uniword/accessibility/rules/reading_order_rule.rb +30 -0
- data/lib/uniword/accessibility/rules/table_headers_rule.rb +61 -0
- data/lib/uniword/accessibility/rules.rb +18 -0
- data/lib/uniword/accessibility.rb +12 -0
- data/lib/uniword/assembly/assembly_manifest.rb +189 -0
- data/lib/uniword/assembly/component_registry.rb +260 -0
- data/lib/uniword/assembly/cross_reference_resolver.rb +241 -0
- data/lib/uniword/assembly/document_assembler.rb +296 -0
- data/lib/uniword/assembly/toc.rb +227 -0
- data/lib/uniword/assembly/toc_entry.rb +124 -0
- data/lib/uniword/assembly/toc_instruction.rb +92 -0
- data/lib/uniword/assembly/variable_substitutor.rb +238 -0
- data/lib/uniword/assembly.rb +14 -0
- data/lib/uniword/batch/batch_result.rb +244 -0
- data/lib/uniword/batch/document_processor.rb +339 -0
- data/lib/uniword/batch/processing_stage.rb +92 -0
- data/lib/uniword/batch/stages/compress_images_stage.rb +187 -0
- data/lib/uniword/batch/stages/convert_format_stage.rb +117 -0
- data/lib/uniword/batch/stages/normalize_styles_stage.rb +174 -0
- data/lib/uniword/batch/stages/quality_check_stage.rb +149 -0
- data/lib/uniword/batch/stages/update_metadata_stage.rb +103 -0
- data/lib/uniword/batch/stages/validate_links_stage.rb +203 -0
- data/lib/uniword/batch.rb +16 -0
- data/lib/uniword/bibliography/author.rb +80 -0
- data/lib/uniword/bibliography/city.rb +22 -0
- data/lib/uniword/bibliography/corporate.rb +22 -0
- data/lib/uniword/bibliography/day.rb +22 -0
- data/lib/uniword/bibliography/edition.rb +22 -0
- data/lib/uniword/bibliography/first.rb +22 -0
- data/lib/uniword/bibliography/first_name.rb +22 -0
- data/lib/uniword/bibliography/guid.rb +22 -0
- data/lib/uniword/bibliography/issue.rb +22 -0
- data/lib/uniword/bibliography/last.rb +22 -0
- data/lib/uniword/bibliography/last_name.rb +22 -0
- data/lib/uniword/bibliography/lcid.rb +22 -0
- data/lib/uniword/bibliography/locale_id.rb +22 -0
- data/lib/uniword/bibliography/month.rb +22 -0
- data/lib/uniword/bibliography/name_list.rb +23 -0
- data/lib/uniword/bibliography/pages.rb +22 -0
- data/lib/uniword/bibliography/person.rb +27 -0
- data/lib/uniword/bibliography/publisher.rb +22 -0
- data/lib/uniword/bibliography/ref_order.rb +22 -0
- data/lib/uniword/bibliography/source.rb +169 -0
- data/lib/uniword/bibliography/source_tag.rb +22 -0
- data/lib/uniword/bibliography/source_type.rb +22 -0
- data/lib/uniword/bibliography/sources.rb +29 -0
- data/lib/uniword/bibliography/tag.rb +22 -0
- data/lib/uniword/bibliography/title.rb +22 -0
- data/lib/uniword/bibliography/url.rb +22 -0
- data/lib/uniword/bibliography/volume_number.rb +22 -0
- data/lib/uniword/bibliography/year.rb +22 -0
- data/lib/uniword/bibliography.rb +45 -0
- data/lib/uniword/bookmark.rb +103 -0
- data/lib/uniword/builder/bibliography_builder.rb +188 -0
- data/lib/uniword/builder/chart_builder.rb +365 -0
- data/lib/uniword/builder/comment_builder.rb +54 -0
- data/lib/uniword/builder/document_builder.rb +548 -0
- data/lib/uniword/builder/footnote_builder.rb +102 -0
- data/lib/uniword/builder/header_footer_builder.rb +79 -0
- data/lib/uniword/builder/image_builder.rb +316 -0
- data/lib/uniword/builder/list_builder.rb +51 -0
- data/lib/uniword/builder/numbering_builder.rb +42 -0
- data/lib/uniword/builder/paragraph_builder.rb +228 -0
- data/lib/uniword/builder/run_builder.rb +285 -0
- data/lib/uniword/builder/sdt_builder.rb +205 -0
- data/lib/uniword/builder/section_builder.rb +170 -0
- data/lib/uniword/builder/style_builder.rb +129 -0
- data/lib/uniword/builder/table_builder.rb +111 -0
- data/lib/uniword/builder/table_cell_builder.rb +138 -0
- data/lib/uniword/builder/table_row_builder.rb +65 -0
- data/lib/uniword/builder/theme_builder.rb +98 -0
- data/lib/uniword/builder/toc_builder.rb +54 -0
- data/lib/uniword/builder/watermark_builder.rb +95 -0
- data/lib/uniword/builder.rb +232 -0
- data/lib/uniword/chart/area3_d_chart.rb +35 -0
- data/lib/uniword/chart/area_chart.rb +33 -0
- data/lib/uniword/chart/auto_title_deleted.rb +22 -0
- data/lib/uniword/chart/axis_id.rb +22 -0
- data/lib/uniword/chart/axis_position.rb +22 -0
- data/lib/uniword/chart/bar3_d_chart.rb +39 -0
- data/lib/uniword/chart/bar_chart.rb +37 -0
- data/lib/uniword/chart/bubble_chart.rb +37 -0
- data/lib/uniword/chart/bubble_size.rb +25 -0
- data/lib/uniword/chart/cat_ax.rb +45 -0
- data/lib/uniword/chart/category_axis_data.rb +29 -0
- data/lib/uniword/chart/chart.rb +33 -0
- data/lib/uniword/chart/chart_reference.rb +24 -0
- data/lib/uniword/chart/chart_space.rb +35 -0
- data/lib/uniword/chart/color_map_override.rb +22 -0
- data/lib/uniword/chart/data_label.rb +35 -0
- data/lib/uniword/chart/data_labels.rb +41 -0
- data/lib/uniword/chart/date_ax.rb +45 -0
- data/lib/uniword/chart/diagram_reference.rb +24 -0
- data/lib/uniword/chart/doughnut_chart.rb +31 -0
- data/lib/uniword/chart/drop_lines.rb +23 -0
- data/lib/uniword/chart/error_bar_type.rb +22 -0
- data/lib/uniword/chart/error_bars.rb +37 -0
- data/lib/uniword/chart/error_direction.rb +22 -0
- data/lib/uniword/chart/explosion.rb +22 -0
- data/lib/uniword/chart/gap_width.rb +22 -0
- data/lib/uniword/chart/hi_low_lines.rb +23 -0
- data/lib/uniword/chart/index.rb +22 -0
- data/lib/uniword/chart/layout.rb +23 -0
- data/lib/uniword/chart/legend.rb +33 -0
- data/lib/uniword/chart/legend_entry.rb +27 -0
- data/lib/uniword/chart/legend_position.rb +22 -0
- data/lib/uniword/chart/line3_d_chart.rb +35 -0
- data/lib/uniword/chart/line_chart.rb +41 -0
- data/lib/uniword/chart/major_gridlines.rb +23 -0
- data/lib/uniword/chart/marker.rb +27 -0
- data/lib/uniword/chart/marker_size.rb +22 -0
- data/lib/uniword/chart/marker_style.rb +22 -0
- data/lib/uniword/chart/minor_gridlines.rb +23 -0
- data/lib/uniword/chart/number_reference.rb +25 -0
- data/lib/uniword/chart/numbering_format.rb +24 -0
- data/lib/uniword/chart/order.rb +22 -0
- data/lib/uniword/chart/orientation.rb +22 -0
- data/lib/uniword/chart/pie3_d_chart.rb +27 -0
- data/lib/uniword/chart/pie_chart.rb +29 -0
- data/lib/uniword/chart/plot_area.rb +35 -0
- data/lib/uniword/chart/plot_vis_only.rb +22 -0
- data/lib/uniword/chart/radar_chart.rb +31 -0
- data/lib/uniword/chart/scaling.rb +29 -0
- data/lib/uniword/chart/scatter_chart.rb +31 -0
- data/lib/uniword/chart/ser_ax.rb +43 -0
- data/lib/uniword/chart/series.rb +29 -0
- data/lib/uniword/chart/series_text.rb +25 -0
- data/lib/uniword/chart/shape_properties.rb +22 -0
- data/lib/uniword/chart/show_category_name.rb +22 -0
- data/lib/uniword/chart/show_legend_key.rb +22 -0
- data/lib/uniword/chart/show_value.rb +22 -0
- data/lib/uniword/chart/smooth.rb +22 -0
- data/lib/uniword/chart/stock_chart.rb +33 -0
- data/lib/uniword/chart/style.rb +22 -0
- data/lib/uniword/chart/surface3_d_chart.rb +29 -0
- data/lib/uniword/chart/surface_chart.rb +29 -0
- data/lib/uniword/chart/text_properties.rb +22 -0
- data/lib/uniword/chart/tick_label_position.rb +22 -0
- data/lib/uniword/chart/title.rb +31 -0
- data/lib/uniword/chart/trendline.rb +35 -0
- data/lib/uniword/chart/trendline_type.rb +22 -0
- data/lib/uniword/chart/up_down_bars.rb +27 -0
- data/lib/uniword/chart/val_ax.rb +49 -0
- data/lib/uniword/chart/values.rb +25 -0
- data/lib/uniword/chart/x_values.rb +25 -0
- data/lib/uniword/chart/y_values.rb +25 -0
- data/lib/uniword/chart.rb +105 -0
- data/lib/uniword/cli.rb +737 -0
- data/lib/uniword/column_configuration.rb +111 -0
- data/lib/uniword/comment.rb +147 -0
- data/lib/uniword/comment_range.rb +122 -0
- data/lib/uniword/comments_part.rb +130 -0
- data/lib/uniword/configuration/configuration_loader.rb +168 -0
- data/lib/uniword/configuration.rb +7 -0
- data/lib/uniword/content_types/default.rb +24 -0
- data/lib/uniword/content_types/override.rb +24 -0
- data/lib/uniword/content_types/types.rb +26 -0
- data/lib/uniword/content_types.rb +76 -0
- data/lib/uniword/customxml/custom_xml.rb +29 -0
- data/lib/uniword/customxml/custom_xml_attribute.rb +26 -0
- data/lib/uniword/customxml/custom_xml_block.rb +29 -0
- data/lib/uniword/customxml/custom_xml_cell.rb +29 -0
- data/lib/uniword/customxml/custom_xml_del_range_start.rb +26 -0
- data/lib/uniword/customxml/custom_xml_ins_range_end.rb +22 -0
- data/lib/uniword/customxml/custom_xml_ins_range_start.rb +26 -0
- data/lib/uniword/customxml/custom_xml_move_from_range_end.rb +22 -0
- data/lib/uniword/customxml/custom_xml_move_from_range_start.rb +26 -0
- data/lib/uniword/customxml/custom_xml_move_to_range_end.rb +22 -0
- data/lib/uniword/customxml/custom_xml_move_to_range_start.rb +26 -0
- data/lib/uniword/customxml/custom_xml_properties.rb +27 -0
- data/lib/uniword/customxml/custom_xml_row.rb +29 -0
- data/lib/uniword/customxml/custom_xml_run.rb +29 -0
- data/lib/uniword/customxml/data_binding.rb +26 -0
- data/lib/uniword/customxml/data_store_item.rb +24 -0
- data/lib/uniword/customxml/element_name.rb +22 -0
- data/lib/uniword/customxml/name.rb +22 -0
- data/lib/uniword/customxml/namespace_uri.rb +22 -0
- data/lib/uniword/customxml/placeholder.rb +22 -0
- data/lib/uniword/customxml/placeholder_text.rb +22 -0
- data/lib/uniword/customxml/prefix_mappings.rb +22 -0
- data/lib/uniword/customxml/schema_reference.rb +41 -0
- data/lib/uniword/customxml/showing_placeholder.rb +24 -0
- data/lib/uniword/customxml/showing_placeholder_header.rb +22 -0
- data/lib/uniword/customxml/smart_tag.rb +29 -0
- data/lib/uniword/customxml/smart_tag_attribute.rb +24 -0
- data/lib/uniword/customxml/smart_tag_element.rb +22 -0
- data/lib/uniword/customxml/smart_tag_name.rb +22 -0
- data/lib/uniword/customxml/smart_tag_properties.rb +23 -0
- data/lib/uniword/customxml/smart_tag_type.rb +26 -0
- data/lib/uniword/customxml/smart_tag_uri.rb +22 -0
- data/lib/uniword/customxml/store_item_id.rb +22 -0
- data/lib/uniword/customxml/x_path.rb +22 -0
- data/lib/uniword/customxml/x_path_expression.rb +22 -0
- data/lib/uniword/customxml.rb +53 -0
- data/lib/uniword/document_factory.rb +214 -0
- data/lib/uniword/document_properties/app_version.rb +22 -0
- data/lib/uniword/document_properties/application.rb +22 -0
- data/lib/uniword/document_properties/bool_value.rb +22 -0
- data/lib/uniword/document_properties/company.rb +22 -0
- data/lib/uniword/document_properties/custom_properties.rb +23 -0
- data/lib/uniword/document_properties/custom_property.rb +37 -0
- data/lib/uniword/document_properties/doc_security.rb +22 -0
- data/lib/uniword/document_properties/extended_properties.rb +41 -0
- data/lib/uniword/document_properties/file_time.rb +22 -0
- data/lib/uniword/document_properties/heading_pairs.rb +23 -0
- data/lib/uniword/document_properties/hyperlinks_changed.rb +22 -0
- data/lib/uniword/document_properties/i4.rb +22 -0
- data/lib/uniword/document_properties/links_up_to_date.rb +22 -0
- data/lib/uniword/document_properties/lpw_str.rb +22 -0
- data/lib/uniword/document_properties/manager.rb +22 -0
- data/lib/uniword/document_properties/scale_crop.rb +22 -0
- data/lib/uniword/document_properties/shared_doc.rb +22 -0
- data/lib/uniword/document_properties/titles_of_parts.rb +23 -0
- data/lib/uniword/document_properties/variant.rb +25 -0
- data/lib/uniword/document_properties/vector.rb +27 -0
- data/lib/uniword/document_properties.rb +32 -0
- data/lib/uniword/document_variables/data_type.rb +22 -0
- data/lib/uniword/document_variables/default_value.rb +22 -0
- data/lib/uniword/document_variables/doc_var.rb +24 -0
- data/lib/uniword/document_variables/doc_vars.rb +23 -0
- data/lib/uniword/document_variables/read_only.rb +24 -0
- data/lib/uniword/document_variables/variable_binding.rb +26 -0
- data/lib/uniword/document_variables/variable_collection.rb +25 -0
- data/lib/uniword/document_variables/variable_expression.rb +22 -0
- data/lib/uniword/document_variables/variable_format.rb +22 -0
- data/lib/uniword/document_variables/variable_scope.rb +22 -0
- data/lib/uniword/document_variables.rb +23 -0
- data/lib/uniword/document_writer.rb +157 -0
- data/lib/uniword/drawingml/adjust_value_list.rb +22 -0
- data/lib/uniword/drawingml/alpha.rb +22 -0
- data/lib/uniword/drawingml/alpha_bi_level.rb +22 -0
- data/lib/uniword/drawingml/alpha_modulation.rb +22 -0
- data/lib/uniword/drawingml/alpha_modulation_fixed.rb +22 -0
- data/lib/uniword/drawingml/alpha_offset.rb +22 -0
- data/lib/uniword/drawingml/arc_to.rb +28 -0
- data/lib/uniword/drawingml/background_color.rb +24 -0
- data/lib/uniword/drawingml/bevel_top.rb +26 -0
- data/lib/uniword/drawingml/bi_level.rb +22 -0
- data/lib/uniword/drawingml/blip.rb +30 -0
- data/lib/uniword/drawingml/blip_fill.rb +28 -0
- data/lib/uniword/drawingml/blue.rb +22 -0
- data/lib/uniword/drawingml/blur.rb +24 -0
- data/lib/uniword/drawingml/body_properties.rb +22 -0
- data/lib/uniword/drawingml/camera.rb +24 -0
- data/lib/uniword/drawingml/close_path.rb +18 -0
- data/lib/uniword/drawingml/color_scheme.rb +381 -0
- data/lib/uniword/drawingml/complex_script_font.rb +24 -0
- data/lib/uniword/drawingml/custom_dash.rb +22 -0
- data/lib/uniword/drawingml/custom_geometry.rb +24 -0
- data/lib/uniword/drawingml/dash_stop.rb +24 -0
- data/lib/uniword/drawingml/default_paragraph_properties.rb +24 -0
- data/lib/uniword/drawingml/duotone.rb +22 -0
- data/lib/uniword/drawingml/east_asian_font.rb +24 -0
- data/lib/uniword/drawingml/effect_container.rb +22 -0
- data/lib/uniword/drawingml/effect_list.rb +30 -0
- data/lib/uniword/drawingml/extension.rb +53 -0
- data/lib/uniword/drawingml/extension_list.rb +25 -0
- data/lib/uniword/drawingml/extents.rb +24 -0
- data/lib/uniword/drawingml/extra_color_scheme_list.rb +20 -0
- data/lib/uniword/drawingml/fill_overlay.rb +22 -0
- data/lib/uniword/drawingml/fill_to_rect.rb +28 -0
- data/lib/uniword/drawingml/font_reference.rb +23 -0
- data/lib/uniword/drawingml/font_scheme.rb +241 -0
- data/lib/uniword/drawingml/foreground_color.rb +24 -0
- data/lib/uniword/drawingml/format_scheme.rb +141 -0
- data/lib/uniword/drawingml/gamma.rb +18 -0
- data/lib/uniword/drawingml/geometry_guide.rb +24 -0
- data/lib/uniword/drawingml/glow.rb +26 -0
- data/lib/uniword/drawingml/gradient_fill.rb +29 -0
- data/lib/uniword/drawingml/gradient_stop.rb +26 -0
- data/lib/uniword/drawingml/gradient_stop_list.rb +23 -0
- data/lib/uniword/drawingml/graphic.rb +21 -0
- data/lib/uniword/drawingml/graphic_data.rb +27 -0
- data/lib/uniword/drawingml/grayscale.rb +18 -0
- data/lib/uniword/drawingml/green.rb +22 -0
- data/lib/uniword/drawingml/group_locking.rb +35 -0
- data/lib/uniword/drawingml/group_shape_properties.rb +21 -0
- data/lib/uniword/drawingml/gvml.rb +26 -0
- data/lib/uniword/drawingml/gvml_connector.rb +25 -0
- data/lib/uniword/drawingml/gvml_connector_non_visual.rb +23 -0
- data/lib/uniword/drawingml/gvml_graphic_frame_non_visual.rb +23 -0
- data/lib/uniword/drawingml/gvml_graphical_object_frame.rb +25 -0
- data/lib/uniword/drawingml/gvml_group_shape.rb +36 -0
- data/lib/uniword/drawingml/gvml_group_shape_non_visual.rb +23 -0
- data/lib/uniword/drawingml/gvml_picture.rb +27 -0
- data/lib/uniword/drawingml/gvml_picture_non_visual.rb +23 -0
- data/lib/uniword/drawingml/gvml_shape.rb +27 -0
- data/lib/uniword/drawingml/gvml_shape_non_visual.rb +23 -0
- data/lib/uniword/drawingml/gvml_text_shape.rb +25 -0
- data/lib/uniword/drawingml/gvml_use_shape_rectangle.rb +17 -0
- data/lib/uniword/drawingml/hue.rb +22 -0
- data/lib/uniword/drawingml/hue_modulation.rb +22 -0
- data/lib/uniword/drawingml/hue_offset.rb +22 -0
- data/lib/uniword/drawingml/inner_shadow.rb +30 -0
- data/lib/uniword/drawingml/inverse_gamma.rb +18 -0
- data/lib/uniword/drawingml/level1_paragraph_properties.rb +24 -0
- data/lib/uniword/drawingml/level2_paragraph_properties.rb +24 -0
- data/lib/uniword/drawingml/level3_paragraph_properties.rb +24 -0
- data/lib/uniword/drawingml/light_rig.rb +26 -0
- data/lib/uniword/drawingml/line_defaults.rb +27 -0
- data/lib/uniword/drawingml/line_join_miter.rb +22 -0
- data/lib/uniword/drawingml/line_join_round.rb +18 -0
- data/lib/uniword/drawingml/line_properties.rb +36 -0
- data/lib/uniword/drawingml/line_to.rb +22 -0
- data/lib/uniword/drawingml/linear_gradient.rb +24 -0
- data/lib/uniword/drawingml/list_style.rb +28 -0
- data/lib/uniword/drawingml/luminance.rb +22 -0
- data/lib/uniword/drawingml/luminance_modulation.rb +22 -0
- data/lib/uniword/drawingml/luminance_offset.rb +22 -0
- data/lib/uniword/drawingml/move_to.rb +22 -0
- data/lib/uniword/drawingml/no_fill.rb +18 -0
- data/lib/uniword/drawingml/non_visual_connector_properties.rb +21 -0
- data/lib/uniword/drawingml/non_visual_drawing_properties.rb +24 -0
- data/lib/uniword/drawingml/non_visual_graphic_frame_properties.rb +21 -0
- data/lib/uniword/drawingml/non_visual_group_drawing_shape_properties.rb +21 -0
- data/lib/uniword/drawingml/non_visual_picture_properties.rb +25 -0
- data/lib/uniword/drawingml/non_visual_shape_properties.rb +22 -0
- data/lib/uniword/drawingml/object_defaults.rb +23 -0
- data/lib/uniword/drawingml/office_art_extension.rb +21 -0
- data/lib/uniword/drawingml/office_art_extension_list.rb +21 -0
- data/lib/uniword/drawingml/offset.rb +24 -0
- data/lib/uniword/drawingml/outer_shadow.rb +38 -0
- data/lib/uniword/drawingml/path_gradient.rb +24 -0
- data/lib/uniword/drawingml/path_list.rb +22 -0
- data/lib/uniword/drawingml/pattern_fill.rb +26 -0
- data/lib/uniword/drawingml/picture_locking.rb +35 -0
- data/lib/uniword/drawingml/preset_dash.rb +22 -0
- data/lib/uniword/drawingml/preset_geometry.rb +24 -0
- data/lib/uniword/drawingml/preset_shadow.rb +26 -0
- data/lib/uniword/drawingml/red.rb +22 -0
- data/lib/uniword/drawingml/red_modulation.rb +22 -0
- data/lib/uniword/drawingml/red_offset.rb +22 -0
- data/lib/uniword/drawingml/reflection.rb +36 -0
- data/lib/uniword/drawingml/relative_rect.rb +27 -0
- data/lib/uniword/drawingml/rotation.rb +26 -0
- data/lib/uniword/drawingml/saturation.rb +22 -0
- data/lib/uniword/drawingml/saturation_modulation.rb +22 -0
- data/lib/uniword/drawingml/saturation_offset.rb +22 -0
- data/lib/uniword/drawingml/scene_3d.rb +24 -0
- data/lib/uniword/drawingml/scheme_color.rb +43 -0
- data/lib/uniword/drawingml/shade.rb +22 -0
- data/lib/uniword/drawingml/shape.rb +24 -0
- data/lib/uniword/drawingml/shape_3d.rb +28 -0
- data/lib/uniword/drawingml/shape_defaults.rb +27 -0
- data/lib/uniword/drawingml/shape_properties.rb +24 -0
- data/lib/uniword/drawingml/shape_style.rb +27 -0
- data/lib/uniword/drawingml/soft_edge.rb +22 -0
- data/lib/uniword/drawingml/solid_fill.rb +24 -0
- data/lib/uniword/drawingml/source_rect.rb +28 -0
- data/lib/uniword/drawingml/srgb_color.rb +43 -0
- data/lib/uniword/drawingml/stretch.rb +18 -0
- data/lib/uniword/drawingml/style_matrix.rb +27 -0
- data/lib/uniword/drawingml/style_matrix_reference.rb +25 -0
- data/lib/uniword/drawingml/style_reference.rb +23 -0
- data/lib/uniword/drawingml/text_body.rb +25 -0
- data/lib/uniword/drawingml/text_character_properties.rb +33 -0
- data/lib/uniword/drawingml/text_defaults.rb +27 -0
- data/lib/uniword/drawingml/text_font.rb +24 -0
- data/lib/uniword/drawingml/text_paragraph.rb +23 -0
- data/lib/uniword/drawingml/text_paragraph_properties.rb +26 -0
- data/lib/uniword/drawingml/text_run.rb +23 -0
- data/lib/uniword/drawingml/theme.rb +263 -0
- data/lib/uniword/drawingml/tile.rb +32 -0
- data/lib/uniword/drawingml/tile_rect.rb +28 -0
- data/lib/uniword/drawingml/tint.rb +22 -0
- data/lib/uniword/drawingml/transform2_d.rb +24 -0
- data/lib/uniword/drawingml.rb +190 -0
- data/lib/uniword/element.rb +52 -0
- data/lib/uniword/element_registry.rb +111 -0
- data/lib/uniword/endnote.rb +66 -0
- data/lib/uniword/errors.rb +140 -0
- data/lib/uniword/field.rb +76 -0
- data/lib/uniword/footer.rb +41 -0
- data/lib/uniword/footnote.rb +65 -0
- data/lib/uniword/format_converter.rb +350 -0
- data/lib/uniword/format_detector.rb +142 -0
- data/lib/uniword/glossary/auto_text.rb +24 -0
- data/lib/uniword/glossary/category_name.rb +22 -0
- data/lib/uniword/glossary/doc_part.rb +25 -0
- data/lib/uniword/glossary/doc_part_behavior.rb +22 -0
- data/lib/uniword/glossary/doc_part_behaviors.rb +23 -0
- data/lib/uniword/glossary/doc_part_body.rb +30 -0
- data/lib/uniword/glossary/doc_part_category.rb +25 -0
- data/lib/uniword/glossary/doc_part_description.rb +22 -0
- data/lib/uniword/glossary/doc_part_gallery.rb +22 -0
- data/lib/uniword/glossary/doc_part_id.rb +22 -0
- data/lib/uniword/glossary/doc_part_name.rb +22 -0
- data/lib/uniword/glossary/doc_part_properties.rb +35 -0
- data/lib/uniword/glossary/doc_part_type.rb +22 -0
- data/lib/uniword/glossary/doc_part_types.rb +25 -0
- data/lib/uniword/glossary/doc_parts.rb +22 -0
- data/lib/uniword/glossary/equation.rb +24 -0
- data/lib/uniword/glossary/glossary_document.rb +32 -0
- data/lib/uniword/glossary/style_id.rb +22 -0
- data/lib/uniword/glossary/text_box.rb +24 -0
- data/lib/uniword/glossary.rb +33 -0
- data/lib/uniword/header.rb +41 -0
- data/lib/uniword/html_importer.rb +55 -0
- data/lib/uniword/hyperlink.rb +76 -0
- data/lib/uniword/image.rb +244 -0
- data/lib/uniword/infrastructure/mime_packager.rb +155 -0
- data/lib/uniword/infrastructure/mime_parser.rb +195 -0
- data/lib/uniword/infrastructure/xml_namespace_normalizer.rb +105 -0
- data/lib/uniword/infrastructure/zip_extractor.rb +133 -0
- data/lib/uniword/infrastructure/zip_packager.rb +249 -0
- data/lib/uniword/infrastructure.rb +10 -0
- data/lib/uniword/lazy_loader.rb +118 -0
- data/lib/uniword/line_numbering.rb +129 -0
- data/lib/uniword/loggable.rb +57 -0
- data/lib/uniword/logger.rb +75 -0
- data/lib/uniword/math/accent.rb +25 -0
- data/lib/uniword/math/accent_properties.rb +25 -0
- data/lib/uniword/math/argument_properties.rb +22 -0
- data/lib/uniword/math/bar.rb +25 -0
- data/lib/uniword/math/bar_properties.rb +25 -0
- data/lib/uniword/math/begin_char.rb +22 -0
- data/lib/uniword/math/border_box.rb +25 -0
- data/lib/uniword/math/border_box_properties.rb +39 -0
- data/lib/uniword/math/box.rb +25 -0
- data/lib/uniword/math/box_properties.rb +33 -0
- data/lib/uniword/math/char.rb +22 -0
- data/lib/uniword/math/control_properties.rb +27 -0
- data/lib/uniword/math/degree.rb +26 -0
- data/lib/uniword/math/delimiter.rb +25 -0
- data/lib/uniword/math/delimiter_properties.rb +33 -0
- data/lib/uniword/math/denominator.rb +26 -0
- data/lib/uniword/math/element.rb +56 -0
- data/lib/uniword/math/end_char.rb +22 -0
- data/lib/uniword/math/equation_array.rb +25 -0
- data/lib/uniword/math/equation_array_properties.rb +33 -0
- data/lib/uniword/math/fraction.rb +27 -0
- data/lib/uniword/math/fraction_properties.rb +25 -0
- data/lib/uniword/math/function.rb +27 -0
- data/lib/uniword/math/function_name.rb +26 -0
- data/lib/uniword/math/function_properties.rb +23 -0
- data/lib/uniword/math/group_char.rb +25 -0
- data/lib/uniword/math/group_char_properties.rb +29 -0
- data/lib/uniword/math/lim.rb +26 -0
- data/lib/uniword/math/lower_limit.rb +27 -0
- data/lib/uniword/math/lower_limit_properties.rb +23 -0
- data/lib/uniword/math/math_break.rb +22 -0
- data/lib/uniword/math/math_font.rb +22 -0
- data/lib/uniword/math/math_properties.rb +53 -0
- data/lib/uniword/math/math_run.rb +42 -0
- data/lib/uniword/math/math_run_properties.rb +37 -0
- data/lib/uniword/math/math_simple_int_val.rb +24 -0
- data/lib/uniword/math/math_simple_val.rb +24 -0
- data/lib/uniword/math/math_style.rb +22 -0
- data/lib/uniword/math/math_text.rb +23 -0
- data/lib/uniword/math/matrix.rb +25 -0
- data/lib/uniword/math/matrix_column.rb +23 -0
- data/lib/uniword/math/matrix_column_properties.rb +24 -0
- data/lib/uniword/math/matrix_columns.rb +23 -0
- data/lib/uniword/math/matrix_properties.rb +37 -0
- data/lib/uniword/math/matrix_row.rb +23 -0
- data/lib/uniword/math/nary.rb +29 -0
- data/lib/uniword/math/nary_properties.rb +33 -0
- data/lib/uniword/math/numerator.rb +26 -0
- data/lib/uniword/math/o_math.rb +54 -0
- data/lib/uniword/math/o_math_para.rb +25 -0
- data/lib/uniword/math/o_math_para_properties.rb +22 -0
- data/lib/uniword/math/phantom.rb +25 -0
- data/lib/uniword/math/phantom_properties.rb +33 -0
- data/lib/uniword/math/plurimath_adapter.rb +289 -0
- data/lib/uniword/math/pre_sub_superscript.rb +29 -0
- data/lib/uniword/math/pre_sub_superscript_properties.rb +23 -0
- data/lib/uniword/math/radical.rb +27 -0
- data/lib/uniword/math/radical_properties.rb +25 -0
- data/lib/uniword/math/separator_char.rb +22 -0
- data/lib/uniword/math/sub.rb +26 -0
- data/lib/uniword/math/sub_superscript.rb +29 -0
- data/lib/uniword/math/sub_superscript_properties.rb +25 -0
- data/lib/uniword/math/subscript.rb +27 -0
- data/lib/uniword/math/subscript_properties.rb +23 -0
- data/lib/uniword/math/sup.rb +26 -0
- data/lib/uniword/math/superscript.rb +27 -0
- data/lib/uniword/math/superscript_properties.rb +23 -0
- data/lib/uniword/math/upper_limit.rb +27 -0
- data/lib/uniword/math/upper_limit_properties.rb +23 -0
- data/lib/uniword/math.rb +90 -0
- data/lib/uniword/math_equation.rb +158 -0
- data/lib/uniword/metadata/metadata.rb +345 -0
- data/lib/uniword/metadata/metadata_extractor.rb +403 -0
- data/lib/uniword/metadata/metadata_index.rb +455 -0
- data/lib/uniword/metadata/metadata_manager.rb +334 -0
- data/lib/uniword/metadata/metadata_updater.rb +243 -0
- data/lib/uniword/metadata/metadata_validator.rb +326 -0
- data/lib/uniword/metadata.rb +12 -0
- data/lib/uniword/mhtml/css_number_formatter.rb +127 -0
- data/lib/uniword/mhtml/document.rb +160 -0
- data/lib/uniword/mhtml/header_footer_part.rb +12 -0
- data/lib/uniword/mhtml/html_part.rb +108 -0
- data/lib/uniword/mhtml/image_part.rb +29 -0
- data/lib/uniword/mhtml/math_converter.rb +153 -0
- data/lib/uniword/mhtml/metadata/document_properties.rb +65 -0
- data/lib/uniword/mhtml/metadata/latent_styles.rb +33 -0
- data/lib/uniword/mhtml/metadata/office_document_settings.rb +22 -0
- data/lib/uniword/mhtml/metadata/word_document_settings.rb +47 -0
- data/lib/uniword/mhtml/metadata.rb +12 -0
- data/lib/uniword/mhtml/mhtml_package.rb +67 -0
- data/lib/uniword/mhtml/mime_part.rb +68 -0
- data/lib/uniword/mhtml/namespaces.rb +31 -0
- data/lib/uniword/mhtml/numbering_configuration.rb +49 -0
- data/lib/uniword/mhtml/styles_configuration.rb +57 -0
- data/lib/uniword/mhtml/theme.rb +50 -0
- data/lib/uniword/mhtml/theme_part.rb +19 -0
- data/lib/uniword/mhtml/word_css.rb +220 -0
- data/lib/uniword/mhtml/wordstyle.css +998 -0
- data/lib/uniword/mhtml/xml_part.rb +18 -0
- data/lib/uniword/mhtml.rb +31 -0
- data/lib/uniword/office/bottom.rb +22 -0
- data/lib/uniword/office/brightness.rb +22 -0
- data/lib/uniword/office/button.rb +26 -0
- data/lib/uniword/office/callout.rb +36 -0
- data/lib/uniword/office/callout_anchor.rb +22 -0
- data/lib/uniword/office/checkbox.rb +24 -0
- data/lib/uniword/office/color_menu.rb +24 -0
- data/lib/uniword/office/color_mru.rb +24 -0
- data/lib/uniword/office/complex.rb +22 -0
- data/lib/uniword/office/diagram.rb +36 -0
- data/lib/uniword/office/diffusity.rb +22 -0
- data/lib/uniword/office/document_protection.rb +26 -0
- data/lib/uniword/office/document_view.rb +22 -0
- data/lib/uniword/office/edge.rb +24 -0
- data/lib/uniword/office/extrusion.rb +54 -0
- data/lib/uniword/office/extrusion_color.rb +24 -0
- data/lib/uniword/office/extrusion_color_mode.rb +22 -0
- data/lib/uniword/office/extrusion_ok.rb +22 -0
- data/lib/uniword/office/field.rb +24 -0
- data/lib/uniword/office/forms.rb +22 -0
- data/lib/uniword/office/id_map.rb +24 -0
- data/lib/uniword/office/ink.rb +24 -0
- data/lib/uniword/office/ink_annotation.rb +24 -0
- data/lib/uniword/office/left.rb +22 -0
- data/lib/uniword/office/lock.rb +30 -0
- data/lib/uniword/office/metal.rb +22 -0
- data/lib/uniword/office/proof_state.rb +24 -0
- data/lib/uniword/office/regroup.rb +22 -0
- data/lib/uniword/office/regroup_table.rb +22 -0
- data/lib/uniword/office/relation_table.rb +22 -0
- data/lib/uniword/office/right.rb +22 -0
- data/lib/uniword/office/rules.rb +22 -0
- data/lib/uniword/office/shape_defaults.rb +29 -0
- data/lib/uniword/office/shape_layout.rb +25 -0
- data/lib/uniword/office/signature_line.rb +40 -0
- data/lib/uniword/office/skew.rb +28 -0
- data/lib/uniword/office/specularity.rb +22 -0
- data/lib/uniword/office/top.rb +22 -0
- data/lib/uniword/office/writing_style.rb +28 -0
- data/lib/uniword/office/zoom.rb +22 -0
- data/lib/uniword/office.rb +57 -0
- data/lib/uniword/ooxml/additional_characteristics.rb +43 -0
- data/lib/uniword/ooxml/app_properties.rb +130 -0
- data/lib/uniword/ooxml/core_properties.rb +69 -0
- data/lib/uniword/ooxml/custom_properties.rb +132 -0
- data/lib/uniword/ooxml/docx_package.rb +989 -0
- data/lib/uniword/ooxml/dotx_package.rb +247 -0
- data/lib/uniword/ooxml/namespaces.rb +363 -0
- data/lib/uniword/ooxml/package_file.rb +227 -0
- data/lib/uniword/ooxml/relationships/hyperlink_relationship.rb +24 -0
- data/lib/uniword/ooxml/relationships/image_relationship.rb +22 -0
- data/lib/uniword/ooxml/relationships/office_document_relationship.rb +24 -0
- data/lib/uniword/ooxml/relationships/package_relationship.rb +29 -0
- data/lib/uniword/ooxml/relationships/package_relationships.rb +51 -0
- data/lib/uniword/ooxml/relationships/relationship.rb +30 -0
- data/lib/uniword/ooxml/relationships/relationships.rb +43 -0
- data/lib/uniword/ooxml/relationships.rb +24 -0
- data/lib/uniword/ooxml/schema/attribute_definition.rb +159 -0
- data/lib/uniword/ooxml/schema/child_definition.rb +125 -0
- data/lib/uniword/ooxml/schema/element_definition.rb +155 -0
- data/lib/uniword/ooxml/schema/element_serializer.rb +319 -0
- data/lib/uniword/ooxml/schema/ooxml_schema.rb +226 -0
- data/lib/uniword/ooxml/schema.rb +16 -0
- data/lib/uniword/ooxml/schema_library.rb +38 -0
- data/lib/uniword/ooxml/styleset_package.rb +122 -0
- data/lib/uniword/ooxml/theme_package.rb +222 -0
- data/lib/uniword/ooxml/thmx_package.rb +127 -0
- data/lib/uniword/ooxml/types/cp_description_type.rb +17 -0
- data/lib/uniword/ooxml/types/cp_keywords_type.rb +17 -0
- data/lib/uniword/ooxml/types/cp_last_modified_by_type.rb +17 -0
- data/lib/uniword/ooxml/types/cp_revision_type.rb +17 -0
- data/lib/uniword/ooxml/types/dc_creator_type.rb +17 -0
- data/lib/uniword/ooxml/types/dc_subject_type.rb +17 -0
- data/lib/uniword/ooxml/types/dc_title_type.rb +17 -0
- data/lib/uniword/ooxml/types/dcterms_created_type.rb +24 -0
- data/lib/uniword/ooxml/types/dcterms_modified_type.rb +24 -0
- data/lib/uniword/ooxml/types/dcterms_w3cdtf_type.rb +49 -0
- data/lib/uniword/ooxml/types/mc_ignorable_type.rb +18 -0
- data/lib/uniword/ooxml/types/on_off_type.rb +64 -0
- data/lib/uniword/ooxml/types/ooxml_boolean.rb +49 -0
- data/lib/uniword/ooxml/types/ooxml_boolean_optional.rb +57 -0
- data/lib/uniword/ooxml/types/variant_types.rb +308 -0
- data/lib/uniword/ooxml/types.rb +76 -0
- data/lib/uniword/ooxml.rb +40 -0
- data/lib/uniword/page_borders.rb +117 -0
- data/lib/uniword/paragraph_border.rb +113 -0
- data/lib/uniword/picture/fill_rect.rb +28 -0
- data/lib/uniword/picture/non_visual_picture_drawing_properties.rb +25 -0
- data/lib/uniword/picture/non_visual_picture_properties.rb +25 -0
- data/lib/uniword/picture/picture.rb +27 -0
- data/lib/uniword/picture/picture_blip_fill.rb +27 -0
- data/lib/uniword/picture/picture_locks.rb +24 -0
- data/lib/uniword/picture/picture_shape_properties.rb +27 -0
- data/lib/uniword/picture/picture_source_rect.rb +28 -0
- data/lib/uniword/picture/picture_stretch.rb +23 -0
- data/lib/uniword/picture/tile.rb +30 -0
- data/lib/uniword/picture.rb +25 -0
- data/lib/uniword/presentationml/audio.rb +26 -0
- data/lib/uniword/presentationml/body_properties.rb +30 -0
- data/lib/uniword/presentationml/break.rb +22 -0
- data/lib/uniword/presentationml/color_map.rb +28 -0
- data/lib/uniword/presentationml/common_slide_data.rb +27 -0
- data/lib/uniword/presentationml/common_time_node.rb +33 -0
- data/lib/uniword/presentationml/connection_shape.rb +25 -0
- data/lib/uniword/presentationml/embed.rb +22 -0
- data/lib/uniword/presentationml/embedded_font.rb +24 -0
- data/lib/uniword/presentationml/end_conditions_list.rb +23 -0
- data/lib/uniword/presentationml/end_paragraph_run_properties.rb +26 -0
- data/lib/uniword/presentationml/extension.rb +22 -0
- data/lib/uniword/presentationml/extension_list.rb +23 -0
- data/lib/uniword/presentationml/field.rb +31 -0
- data/lib/uniword/presentationml/graphic_frame.rb +27 -0
- data/lib/uniword/presentationml/group_shape.rb +29 -0
- data/lib/uniword/presentationml/handout_master.rb +25 -0
- data/lib/uniword/presentationml/handout_master_id_list.rb +22 -0
- data/lib/uniword/presentationml/list_style.rb +29 -0
- data/lib/uniword/presentationml/non_visual_shape_properties.rb +27 -0
- data/lib/uniword/presentationml/notes.rb +27 -0
- data/lib/uniword/presentationml/notes_master_id_list.rb +22 -0
- data/lib/uniword/presentationml/notes_size.rb +24 -0
- data/lib/uniword/presentationml/ole_object.rb +26 -0
- data/lib/uniword/presentationml/paragraph.rb +31 -0
- data/lib/uniword/presentationml/paragraph_properties.rb +30 -0
- data/lib/uniword/presentationml/parallel_time_node.rb +23 -0
- data/lib/uniword/presentationml/picture.rb +27 -0
- data/lib/uniword/presentationml/presentation.rb +39 -0
- data/lib/uniword/presentationml/run.rb +25 -0
- data/lib/uniword/presentationml/run_properties.rb +34 -0
- data/lib/uniword/presentationml/sequence_time_node.rb +27 -0
- data/lib/uniword/presentationml/shape.rb +27 -0
- data/lib/uniword/presentationml/shape_properties.rb +31 -0
- data/lib/uniword/presentationml/shape_tree.rb +35 -0
- data/lib/uniword/presentationml/slide.rb +33 -0
- data/lib/uniword/presentationml/slide_id.rb +24 -0
- data/lib/uniword/presentationml/slide_id_list.rb +23 -0
- data/lib/uniword/presentationml/slide_layout.rb +33 -0
- data/lib/uniword/presentationml/slide_master.rb +33 -0
- data/lib/uniword/presentationml/slide_master_id.rb +24 -0
- data/lib/uniword/presentationml/slide_master_id_list.rb +23 -0
- data/lib/uniword/presentationml/slide_size.rb +26 -0
- data/lib/uniword/presentationml/start_conditions_list.rb +23 -0
- data/lib/uniword/presentationml/text_body.rb +27 -0
- data/lib/uniword/presentationml/time_node_list.rb +25 -0
- data/lib/uniword/presentationml/timing.rb +25 -0
- data/lib/uniword/presentationml/transition.rb +33 -0
- data/lib/uniword/presentationml/video.rb +24 -0
- data/lib/uniword/presentationml.rb +67 -0
- data/lib/uniword/properties/alignment.rb +26 -0
- data/lib/uniword/properties/bold.rb +40 -0
- data/lib/uniword/properties/boolean_formatting.rb +214 -0
- data/lib/uniword/properties/border.rb +48 -0
- data/lib/uniword/properties/borders.rb +39 -0
- data/lib/uniword/properties/cell_vertical_align.rb +32 -0
- data/lib/uniword/properties/cell_width.rb +28 -0
- data/lib/uniword/properties/character_spacing.rb +34 -0
- data/lib/uniword/properties/color_value.rb +57 -0
- data/lib/uniword/properties/contextual_spacing.rb +32 -0
- data/lib/uniword/properties/emphasis_mark.rb +35 -0
- data/lib/uniword/properties/font_size.rb +26 -0
- data/lib/uniword/properties/highlight.rb +28 -0
- data/lib/uniword/properties/indentation.rb +28 -0
- data/lib/uniword/properties/italic.rb +40 -0
- data/lib/uniword/properties/kerning.rb +34 -0
- data/lib/uniword/properties/language.rb +39 -0
- data/lib/uniword/properties/margin.rb +22 -0
- data/lib/uniword/properties/numbering_id.rb +26 -0
- data/lib/uniword/properties/numbering_level.rb +26 -0
- data/lib/uniword/properties/numbering_properties.rb +25 -0
- data/lib/uniword/properties/outline.rb +33 -0
- data/lib/uniword/properties/outline_level.rb +26 -0
- data/lib/uniword/properties/position.rb +33 -0
- data/lib/uniword/properties/run_fonts.rb +38 -0
- data/lib/uniword/properties/shading.rb +41 -0
- data/lib/uniword/properties/spacing.rb +28 -0
- data/lib/uniword/properties/style_reference.rb +81 -0
- data/lib/uniword/properties/tab_stop.rb +45 -0
- data/lib/uniword/properties/table_cell_margin.rb +33 -0
- data/lib/uniword/properties/table_indent.rb +23 -0
- data/lib/uniword/properties/table_justification.rb +22 -0
- data/lib/uniword/properties/table_look.rb +36 -0
- data/lib/uniword/properties/table_width.rb +28 -0
- data/lib/uniword/properties/tabs.rb +64 -0
- data/lib/uniword/properties/text_fill.rb +38 -0
- data/lib/uniword/properties/text_outline.rb +34 -0
- data/lib/uniword/properties/underline.rb +32 -0
- data/lib/uniword/properties/vertical_align.rb +26 -0
- data/lib/uniword/properties/width_scale.rb +34 -0
- data/lib/uniword/properties.rb +71 -0
- data/lib/uniword/quality/document_checker.rb +150 -0
- data/lib/uniword/quality/quality_report.rb +317 -0
- data/lib/uniword/quality/quality_rule.rb +153 -0
- data/lib/uniword/quality/rules/heading_hierarchy_rule.rb +83 -0
- data/lib/uniword/quality/rules/image_alt_text_rule.rb +87 -0
- data/lib/uniword/quality/rules/link_validation_rule.rb +136 -0
- data/lib/uniword/quality/rules/paragraph_length_rule.rb +77 -0
- data/lib/uniword/quality/rules/style_consistency_rule.rb +116 -0
- data/lib/uniword/quality/rules/table_header_rule.rb +69 -0
- data/lib/uniword/quality.rb +16 -0
- data/lib/uniword/resource/cache.rb +82 -0
- data/lib/uniword/resource/cache_paths.rb +29 -0
- data/lib/uniword/resource/cache_version.rb +49 -0
- data/lib/uniword/resource/color_transformer.rb +134 -0
- data/lib/uniword/resource/font_substitutor.rb +60 -0
- data/lib/uniword/resource/importer.rb +114 -0
- data/lib/uniword/resource/resource_location.rb +35 -0
- data/lib/uniword/resource/resource_resolver.rb +100 -0
- data/lib/uniword/resource/theme_processor.rb +107 -0
- data/lib/uniword/resource.rb +19 -0
- data/lib/uniword/revision.rb +200 -0
- data/lib/uniword/schema/model_generator.rb +182 -0
- data/lib/uniword/schema/schema_loader.rb +90 -0
- data/lib/uniword/schema.rb +8 -0
- data/lib/uniword/section.rb +183 -0
- data/lib/uniword/section_properties.rb +180 -0
- data/lib/uniword/serialization/ooxml_serializer.rb +30 -0
- data/lib/uniword/shading.rb +109 -0
- data/lib/uniword/shared_types/angle.rb +22 -0
- data/lib/uniword/shared_types/boolean_value.rb +24 -0
- data/lib/uniword/shared_types/decimal_number.rb +22 -0
- data/lib/uniword/shared_types/emu_measure.rb +22 -0
- data/lib/uniword/shared_types/fixed_percentage.rb +22 -0
- data/lib/uniword/shared_types/hex_color.rb +22 -0
- data/lib/uniword/shared_types/on_off.rb +24 -0
- data/lib/uniword/shared_types/percent_value.rb +22 -0
- data/lib/uniword/shared_types/pixel_measure.rb +22 -0
- data/lib/uniword/shared_types/point_measure.rb +22 -0
- data/lib/uniword/shared_types/positive_percentage.rb +22 -0
- data/lib/uniword/shared_types/string_type.rb +22 -0
- data/lib/uniword/shared_types/text_alignment.rb +22 -0
- data/lib/uniword/shared_types/twips_measure.rb +22 -0
- data/lib/uniword/shared_types/vertical_alignment.rb +22 -0
- data/lib/uniword/shared_types.rb +31 -0
- data/lib/uniword/spreadsheetml/alignment.rb +32 -0
- data/lib/uniword/spreadsheetml/authors.rb +23 -0
- data/lib/uniword/spreadsheetml/auto_filter.rb +25 -0
- data/lib/uniword/spreadsheetml/bold.rb +22 -0
- data/lib/uniword/spreadsheetml/book_views.rb +23 -0
- data/lib/uniword/spreadsheetml/border.rb +31 -0
- data/lib/uniword/spreadsheetml/borders.rb +25 -0
- data/lib/uniword/spreadsheetml/calc_properties.rb +26 -0
- data/lib/uniword/spreadsheetml/cell.rb +31 -0
- data/lib/uniword/spreadsheetml/cell_format.rb +41 -0
- data/lib/uniword/spreadsheetml/cell_formats.rb +25 -0
- data/lib/uniword/spreadsheetml/cell_formula.rb +28 -0
- data/lib/uniword/spreadsheetml/cell_style.rb +31 -0
- data/lib/uniword/spreadsheetml/cell_style_xfs.rb +23 -0
- data/lib/uniword/spreadsheetml/cell_styles.rb +23 -0
- data/lib/uniword/spreadsheetml/cell_value.rb +22 -0
- data/lib/uniword/spreadsheetml/chartsheet.rb +25 -0
- data/lib/uniword/spreadsheetml/col.rb +32 -0
- data/lib/uniword/spreadsheetml/col_breaks.rb +25 -0
- data/lib/uniword/spreadsheetml/color.rb +28 -0
- data/lib/uniword/spreadsheetml/color_filter.rb +23 -0
- data/lib/uniword/spreadsheetml/colors.rb +21 -0
- data/lib/uniword/spreadsheetml/cols.rb +23 -0
- data/lib/uniword/spreadsheetml/comment.rb +27 -0
- data/lib/uniword/spreadsheetml/comment_list.rb +23 -0
- data/lib/uniword/spreadsheetml/comments.rb +25 -0
- data/lib/uniword/spreadsheetml/conditional_formatting.rb +25 -0
- data/lib/uniword/spreadsheetml/conditional_formatting_rule.rb +27 -0
- data/lib/uniword/spreadsheetml/custom_filter.rb +23 -0
- data/lib/uniword/spreadsheetml/custom_filters.rb +23 -0
- data/lib/uniword/spreadsheetml/custom_workbook_views.rb +23 -0
- data/lib/uniword/spreadsheetml/data_validation.rb +43 -0
- data/lib/uniword/spreadsheetml/data_validations.rb +25 -0
- data/lib/uniword/spreadsheetml/date_group_item.rb +33 -0
- data/lib/uniword/spreadsheetml/defined_name.rb +28 -0
- data/lib/uniword/spreadsheetml/defined_names.rb +23 -0
- data/lib/uniword/spreadsheetml/dimension.rb +22 -0
- data/lib/uniword/spreadsheetml/drawing.rb +22 -0
- data/lib/uniword/spreadsheetml/dynamic_filter.rb +25 -0
- data/lib/uniword/spreadsheetml/external_reference.rb +21 -0
- data/lib/uniword/spreadsheetml/external_references.rb +23 -0
- data/lib/uniword/spreadsheetml/file_sharing.rb +22 -0
- data/lib/uniword/spreadsheetml/file_version.rb +24 -0
- data/lib/uniword/spreadsheetml/fill.rb +23 -0
- data/lib/uniword/spreadsheetml/fills.rb +25 -0
- data/lib/uniword/spreadsheetml/filter.rb +21 -0
- data/lib/uniword/spreadsheetml/filter_column.rb +37 -0
- data/lib/uniword/spreadsheetml/filters.rb +27 -0
- data/lib/uniword/spreadsheetml/font.rb +31 -0
- data/lib/uniword/spreadsheetml/font_name.rb +22 -0
- data/lib/uniword/spreadsheetml/font_size.rb +22 -0
- data/lib/uniword/spreadsheetml/fonts.rb +25 -0
- data/lib/uniword/spreadsheetml/hyperlink.rb +30 -0
- data/lib/uniword/spreadsheetml/hyperlinks.rb +23 -0
- data/lib/uniword/spreadsheetml/icon_filter.rb +23 -0
- data/lib/uniword/spreadsheetml/italic.rb +22 -0
- data/lib/uniword/spreadsheetml/legacy_drawing.rb +22 -0
- data/lib/uniword/spreadsheetml/merge_cell.rb +22 -0
- data/lib/uniword/spreadsheetml/merge_cells.rb +25 -0
- data/lib/uniword/spreadsheetml/number_format.rb +24 -0
- data/lib/uniword/spreadsheetml/number_formats.rb +25 -0
- data/lib/uniword/spreadsheetml/ole_object.rb +24 -0
- data/lib/uniword/spreadsheetml/ole_objects.rb +23 -0
- data/lib/uniword/spreadsheetml/ole_size.rb +21 -0
- data/lib/uniword/spreadsheetml/pattern_fill.rb +27 -0
- data/lib/uniword/spreadsheetml/phonetic_pr.rb +35 -0
- data/lib/uniword/spreadsheetml/phonetic_properties.rb +24 -0
- data/lib/uniword/spreadsheetml/pivot_caches.rb +23 -0
- data/lib/uniword/spreadsheetml/pivot_table.rb +24 -0
- data/lib/uniword/spreadsheetml/pivot_table_definition.rb +26 -0
- data/lib/uniword/spreadsheetml/protected_ranges.rb +23 -0
- data/lib/uniword/spreadsheetml/query_table.rb +24 -0
- data/lib/uniword/spreadsheetml/rich_text_run.rb +25 -0
- data/lib/uniword/spreadsheetml/row.rb +33 -0
- data/lib/uniword/spreadsheetml/row_breaks.rb +25 -0
- data/lib/uniword/spreadsheetml/run_properties.rb +29 -0
- data/lib/uniword/spreadsheetml/scenarios.rb +27 -0
- data/lib/uniword/spreadsheetml/shared_string_table.rb +27 -0
- data/lib/uniword/spreadsheetml/sheet.rb +28 -0
- data/lib/uniword/spreadsheetml/sheet_data.rb +23 -0
- data/lib/uniword/spreadsheetml/sheet_format_pr.rb +33 -0
- data/lib/uniword/spreadsheetml/sheet_protection.rb +28 -0
- data/lib/uniword/spreadsheetml/sheet_view.rb +30 -0
- data/lib/uniword/spreadsheetml/sheet_views.rb +23 -0
- data/lib/uniword/spreadsheetml/sheets.rb +23 -0
- data/lib/uniword/spreadsheetml/sort_condition.rb +33 -0
- data/lib/uniword/spreadsheetml/sort_state.rb +23 -0
- data/lib/uniword/spreadsheetml/sparkline_group.rb +24 -0
- data/lib/uniword/spreadsheetml/sparkline_groups.rb +23 -0
- data/lib/uniword/spreadsheetml/string_item.rb +27 -0
- data/lib/uniword/spreadsheetml/table.rb +35 -0
- data/lib/uniword/spreadsheetml/table_column.rb +24 -0
- data/lib/uniword/spreadsheetml/table_columns.rb +25 -0
- data/lib/uniword/spreadsheetml/table_formula.rb +23 -0
- data/lib/uniword/spreadsheetml/table_parts.rb +23 -0
- data/lib/uniword/spreadsheetml/table_style_info.rb +30 -0
- data/lib/uniword/spreadsheetml/table_styles.rb +23 -0
- data/lib/uniword/spreadsheetml/text.rb +24 -0
- data/lib/uniword/spreadsheetml/top10.rb +27 -0
- data/lib/uniword/spreadsheetml/workbook.rb +31 -0
- data/lib/uniword/spreadsheetml/workbook_properties.rb +26 -0
- data/lib/uniword/spreadsheetml/workbook_protection.rb +24 -0
- data/lib/uniword/spreadsheetml/workbook_view.rb +26 -0
- data/lib/uniword/spreadsheetml/worksheet/sheet_format_pr.rb +35 -0
- data/lib/uniword/spreadsheetml/worksheet.rb +33 -0
- data/lib/uniword/spreadsheetml.rb +121 -0
- data/lib/uniword/streaming_parser.rb +277 -0
- data/lib/uniword/styles.rb +14 -0
- data/lib/uniword/styleset.rb +166 -0
- data/lib/uniword/stylesets/package.rb +107 -0
- data/lib/uniword/stylesets/styleset_importer.rb +96 -0
- data/lib/uniword/stylesets/yaml_styleset_loader.rb +58 -0
- data/lib/uniword/stylesets.rb +9 -0
- data/lib/uniword/tab_stop.rb +85 -0
- data/lib/uniword/table_border.rb +87 -0
- data/lib/uniword/template/helpers/conditional_helper.rb +107 -0
- data/lib/uniword/template/helpers/filter_helper.rb +124 -0
- data/lib/uniword/template/helpers/loop_helper.rb +119 -0
- data/lib/uniword/template/helpers/variable_helper.rb +85 -0
- data/lib/uniword/template/helpers.rb +12 -0
- data/lib/uniword/template/template.rb +147 -0
- data/lib/uniword/template/template_context.rb +103 -0
- data/lib/uniword/template/template_marker.rb +121 -0
- data/lib/uniword/template/template_parser.rb +186 -0
- data/lib/uniword/template/template_renderer.rb +204 -0
- data/lib/uniword/template/template_validator.rb +202 -0
- data/lib/uniword/template/variable_resolver.rb +195 -0
- data/lib/uniword/template.rb +14 -0
- data/lib/uniword/text_box.rb +55 -0
- data/lib/uniword/text_frame.rb +168 -0
- data/lib/uniword/theme/media_file.rb +128 -0
- data/lib/uniword/theme/theme_applicator.rb +141 -0
- data/lib/uniword/theme/theme_loader.rb +107 -0
- data/lib/uniword/theme/theme_package_reader.rb +102 -0
- data/lib/uniword/theme/theme_variant.rb +87 -0
- data/lib/uniword/theme/theme_xml_parser.rb +239 -0
- data/lib/uniword/theme_writer.rb +58 -0
- data/lib/uniword/themes/theme.rb +159 -0
- data/lib/uniword/themes/theme_importer.rb +138 -0
- data/lib/uniword/themes/theme_transformation.rb +202 -0
- data/lib/uniword/themes.rb +23 -0
- data/lib/uniword/tracked_changes.rb +231 -0
- data/lib/uniword/transformation/html_to_ooxml_converter.rb +541 -0
- data/lib/uniword/transformation/hyperlink_transformation_rule.rb +72 -0
- data/lib/uniword/transformation/image_transformation_rule.rb +69 -0
- data/lib/uniword/transformation/ooxml_to_html_converter.rb +172 -0
- data/lib/uniword/transformation/ooxml_to_mhtml_converter.rb +1406 -0
- data/lib/uniword/transformation/paragraph_transformation_rule.rb +166 -0
- data/lib/uniword/transformation/run_transformation_rule.rb +76 -0
- data/lib/uniword/transformation/table_transformation_rule.rb +120 -0
- data/lib/uniword/transformation/transformation_rule.rb +91 -0
- data/lib/uniword/transformation/transformation_rule_registry.rb +133 -0
- data/lib/uniword/transformation/transformer.rb +386 -0
- data/lib/uniword/transformation.rb +18 -0
- data/lib/uniword/validation/checkers/external_link_checker.rb +200 -0
- data/lib/uniword/validation/checkers/file_reference_checker.rb +196 -0
- data/lib/uniword/validation/checkers/footnote_reference_checker.rb +178 -0
- data/lib/uniword/validation/checkers/internal_link_checker.rb +181 -0
- data/lib/uniword/validation/checkers.rb +12 -0
- data/lib/uniword/validation/document_validator.rb +272 -0
- data/lib/uniword/validation/layer_validation_result.rb +157 -0
- data/lib/uniword/validation/layer_validator.rb +104 -0
- data/lib/uniword/validation/link_checker.rb +94 -0
- data/lib/uniword/validation/link_validator.rb +318 -0
- data/lib/uniword/validation/validation_report.rb +409 -0
- data/lib/uniword/validation/validation_result.rb +215 -0
- data/lib/uniword/validation/validators/content_type_validator.rb +159 -0
- data/lib/uniword/validation/validators/document_semantics_validator.rb +152 -0
- data/lib/uniword/validation/validators/file_structure_validator.rb +101 -0
- data/lib/uniword/validation/validators/ooxml_part_validator.rb +128 -0
- data/lib/uniword/validation/validators/relationship_validator.rb +146 -0
- data/lib/uniword/validation/validators/xml_schema_validator.rb +120 -0
- data/lib/uniword/validation/validators/zip_integrity_validator.rb +110 -0
- data/lib/uniword/validation/validators.rb +15 -0
- data/lib/uniword/validation.rb +15 -0
- data/lib/uniword/validators/element_validator.rb +97 -0
- data/lib/uniword/validators/paragraph_validator.rb +122 -0
- data/lib/uniword/validators/table_validator.rb +140 -0
- data/lib/uniword/validators.rb +9 -0
- data/lib/uniword/version.rb +5 -0
- data/lib/uniword/visitor/base_visitor.rb +81 -0
- data/lib/uniword/visitor/text_extractor.rb +119 -0
- data/lib/uniword/visitor.rb +8 -0
- data/lib/uniword/vml/arc.rb +41 -0
- data/lib/uniword/vml/background.rb +33 -0
- data/lib/uniword/vml/curve.rb +36 -0
- data/lib/uniword/vml/fill.rb +32 -0
- data/lib/uniword/vml/formula.rb +23 -0
- data/lib/uniword/vml/formulas.rb +24 -0
- data/lib/uniword/vml/group.rb +30 -0
- data/lib/uniword/vml/handle.rb +39 -0
- data/lib/uniword/vml/handles.rb +24 -0
- data/lib/uniword/vml/image.rb +47 -0
- data/lib/uniword/vml/imagedata.rb +34 -0
- data/lib/uniword/vml/line.rb +34 -0
- data/lib/uniword/vml/oval.rb +34 -0
- data/lib/uniword/vml/path.rb +28 -0
- data/lib/uniword/vml/polyline.rb +32 -0
- data/lib/uniword/vml/rect.rb +34 -0
- data/lib/uniword/vml/roundrect.rb +39 -0
- data/lib/uniword/vml/shadow.rb +33 -0
- data/lib/uniword/vml/shape.rb +73 -0
- data/lib/uniword/vml/shapetype.rb +32 -0
- data/lib/uniword/vml/stroke.rb +34 -0
- data/lib/uniword/vml/textbox.rb +28 -0
- data/lib/uniword/vml/textpath.rb +25 -0
- data/lib/uniword/vml/wrap.rb +24 -0
- data/lib/uniword/vml.rb +39 -0
- data/lib/uniword/vml_office/vml_anchor_lock.rb +22 -0
- data/lib/uniword/vml_office/vml_bottom.rb +24 -0
- data/lib/uniword/vml_office/vml_callout.rb +35 -0
- data/lib/uniword/vml_office/vml_clip_path.rb +24 -0
- data/lib/uniword/vml_office/vml_color_mru.rb +24 -0
- data/lib/uniword/vml_office/vml_column.rb +24 -0
- data/lib/uniword/vml_office/vml_complex.rb +22 -0
- data/lib/uniword/vml_office/vml_complex_extension.rb +24 -0
- data/lib/uniword/vml_office/vml_diagram.rb +32 -0
- data/lib/uniword/vml_office/vml_entry.rb +24 -0
- data/lib/uniword/vml_office/vml_extrusion.rb +43 -0
- data/lib/uniword/vml_office/vml_id_map.rb +24 -0
- data/lib/uniword/vml_office/vml_ink.rb +26 -0
- data/lib/uniword/vml_office/vml_left.rb +24 -0
- data/lib/uniword/vml_office/vml_lock.rb +37 -0
- data/lib/uniword/vml_office/vml_office_fill.rb +32 -0
- data/lib/uniword/vml_office/vml_proxy.rb +28 -0
- data/lib/uniword/vml_office/vml_regroup.rb +22 -0
- data/lib/uniword/vml_office/vml_relation_table.rb +24 -0
- data/lib/uniword/vml_office/vml_right.rb +24 -0
- data/lib/uniword/vml_office/vml_rule.rb +26 -0
- data/lib/uniword/vml_office/vml_rules.rb +24 -0
- data/lib/uniword/vml_office/vml_shape_defaults.rb +53 -0
- data/lib/uniword/vml_office/vml_shape_layout.rb +70 -0
- data/lib/uniword/vml_office/vml_signature_line.rb +38 -0
- data/lib/uniword/vml_office/vml_skew.rb +29 -0
- data/lib/uniword/vml_office/vml_top.rb +24 -0
- data/lib/uniword/vml_office/vml_wrap_block.rb +24 -0
- data/lib/uniword/vml_office/vml_wrap_coords.rb +22 -0
- data/lib/uniword/vml_office.rb +47 -0
- data/lib/uniword/vml_word/border_bottom.rb +29 -0
- data/lib/uniword/vml_word/border_left.rb +29 -0
- data/lib/uniword/vml_word/border_right.rb +29 -0
- data/lib/uniword/vml_word/border_top.rb +29 -0
- data/lib/uniword/vml_word.rb +17 -0
- data/lib/uniword/warnings/warning.rb +130 -0
- data/lib/uniword/warnings/warning_collector.rb +229 -0
- data/lib/uniword/warnings/warning_report.rb +159 -0
- data/lib/uniword/warnings.rb +9 -0
- data/lib/uniword/word2010_ext/wrap.rb +26 -0
- data/lib/uniword/word2010_ext.rb +14 -0
- data/lib/uniword/word_implementation.rb +58 -0
- data/lib/uniword/word_implementation_factory.rb +15 -0
- data/lib/uniword/word_implementation_linux.rb +42 -0
- data/lib/uniword/word_implementation_macos.rb +41 -0
- data/lib/uniword/word_implementation_null.rb +34 -0
- data/lib/uniword/word_implementation_windows.rb +75 -0
- data/lib/uniword/wordprocessing_group.rb +29 -0
- data/lib/uniword/wordprocessing_shape.rb +48 -0
- data/lib/uniword/wordprocessingml/abstract_num.rb +27 -0
- data/lib/uniword/wordprocessingml/abstract_num_id.rb +22 -0
- data/lib/uniword/wordprocessingml/alternate_content.rb +24 -0
- data/lib/uniword/wordprocessingml/anchor.rb +35 -0
- data/lib/uniword/wordprocessingml/based_on.rb +22 -0
- data/lib/uniword/wordprocessingml/body.rb +95 -0
- data/lib/uniword/wordprocessingml/bookmark_end.rb +22 -0
- data/lib/uniword/wordprocessingml/bookmark_start.rb +24 -0
- data/lib/uniword/wordprocessingml/border.rb +30 -0
- data/lib/uniword/wordprocessingml/break.rb +24 -0
- data/lib/uniword/wordprocessingml/carriage_return.rb +17 -0
- data/lib/uniword/wordprocessingml/character_style.rb +199 -0
- data/lib/uniword/wordprocessingml/choice.rb +24 -0
- data/lib/uniword/wordprocessingml/cnf_style.rb +52 -0
- data/lib/uniword/wordprocessingml/columns.rb +26 -0
- data/lib/uniword/wordprocessingml/comment_range_end.rb +22 -0
- data/lib/uniword/wordprocessingml/comment_range_start.rb +22 -0
- data/lib/uniword/wordprocessingml/comment_reference.rb +22 -0
- data/lib/uniword/wordprocessingml/compat.rb +35 -0
- data/lib/uniword/wordprocessingml/compat_setting.rb +26 -0
- data/lib/uniword/wordprocessingml/deleted_text.rb +29 -0
- data/lib/uniword/wordprocessingml/doc_defaults.rb +25 -0
- data/lib/uniword/wordprocessingml/doc_grid.rb +25 -0
- data/lib/uniword/wordprocessingml/doc_pr.rb +26 -0
- data/lib/uniword/wordprocessingml/document_root.rb +251 -0
- data/lib/uniword/wordprocessingml/drawing.rb +24 -0
- data/lib/uniword/wordprocessingml/emboss.rb +24 -0
- data/lib/uniword/wordprocessingml/endnote.rb +27 -0
- data/lib/uniword/wordprocessingml/endnote_ref.rb +20 -0
- data/lib/uniword/wordprocessingml/endnote_reference.rb +22 -0
- data/lib/uniword/wordprocessingml/endnotes.rb +23 -0
- data/lib/uniword/wordprocessingml/extent.rb +24 -0
- data/lib/uniword/wordprocessingml/fallback.rb +24 -0
- data/lib/uniword/wordprocessingml/field_char.rb +24 -0
- data/lib/uniword/wordprocessingml/font.rb +110 -0
- data/lib/uniword/wordprocessingml/font_table.rb +30 -0
- data/lib/uniword/wordprocessingml/fonts.rb +23 -0
- data/lib/uniword/wordprocessingml/footer.rb +25 -0
- data/lib/uniword/wordprocessingml/footer_reference.rb +27 -0
- data/lib/uniword/wordprocessingml/footnote.rb +27 -0
- data/lib/uniword/wordprocessingml/footnote_ref.rb +20 -0
- data/lib/uniword/wordprocessingml/footnote_reference.rb +22 -0
- data/lib/uniword/wordprocessingml/footnotes.rb +23 -0
- data/lib/uniword/wordprocessingml/graphic.rb +23 -0
- data/lib/uniword/wordprocessingml/graphic_data.rb +22 -0
- data/lib/uniword/wordprocessingml/grid_after.rb +17 -0
- data/lib/uniword/wordprocessingml/grid_before.rb +17 -0
- data/lib/uniword/wordprocessingml/grid_col.rb +22 -0
- data/lib/uniword/wordprocessingml/header.rb +25 -0
- data/lib/uniword/wordprocessingml/header_reference.rb +27 -0
- data/lib/uniword/wordprocessingml/hyperlink.rb +73 -0
- data/lib/uniword/wordprocessingml/imprint.rb +24 -0
- data/lib/uniword/wordprocessingml/inline.rb +27 -0
- data/lib/uniword/wordprocessingml/instr_text.rb +32 -0
- data/lib/uniword/wordprocessingml/last_rendered_page_break.rb +16 -0
- data/lib/uniword/wordprocessingml/latent_styles.rb +59 -0
- data/lib/uniword/wordprocessingml/level.rb +103 -0
- data/lib/uniword/wordprocessingml/link.rb +22 -0
- data/lib/uniword/wordprocessingml/lvl_jc.rb +22 -0
- data/lib/uniword/wordprocessingml/lvl_text.rb +22 -0
- data/lib/uniword/wordprocessingml/mc_requires.rb +11 -0
- data/lib/uniword/wordprocessingml/multi_level_type.rb +22 -0
- data/lib/uniword/wordprocessingml/next.rb +22 -0
- data/lib/uniword/wordprocessingml/no_break_hyphen.rb +17 -0
- data/lib/uniword/wordprocessingml/no_wrap.rb +16 -0
- data/lib/uniword/wordprocessingml/num.rb +25 -0
- data/lib/uniword/wordprocessingml/num_fmt.rb +22 -0
- data/lib/uniword/wordprocessingml/numbering.rb +25 -0
- data/lib/uniword/wordprocessingml/numbering_configuration.rb +173 -0
- data/lib/uniword/wordprocessingml/numbering_definition.rb +155 -0
- data/lib/uniword/wordprocessingml/numbering_elements.rb +78 -0
- data/lib/uniword/wordprocessingml/numbering_instance.rb +55 -0
- data/lib/uniword/wordprocessingml/numbering_level.rb +90 -0
- data/lib/uniword/wordprocessingml/object.rb +24 -0
- data/lib/uniword/wordprocessingml/outline.rb +24 -0
- data/lib/uniword/wordprocessingml/p_pr_default.rb +23 -0
- data/lib/uniword/wordprocessingml/page_margins.rb +34 -0
- data/lib/uniword/wordprocessingml/page_numbering.rb +24 -0
- data/lib/uniword/wordprocessingml/page_size.rb +26 -0
- data/lib/uniword/wordprocessingml/paragraph.rb +197 -0
- data/lib/uniword/wordprocessingml/paragraph_borders.rb +58 -0
- data/lib/uniword/wordprocessingml/paragraph_properties.rb +339 -0
- data/lib/uniword/wordprocessingml/paragraph_style.rb +163 -0
- data/lib/uniword/wordprocessingml/pict.rb +23 -0
- data/lib/uniword/wordprocessingml/picture.rb +27 -0
- data/lib/uniword/wordprocessingml/position_tab.rb +26 -0
- data/lib/uniword/wordprocessingml/proof_err.rb +20 -0
- data/lib/uniword/wordprocessingml/r_pr_default.rb +23 -0
- data/lib/uniword/wordprocessingml/recipient_data.rb +25 -0
- data/lib/uniword/wordprocessingml/recipients.rb +21 -0
- data/lib/uniword/wordprocessingml/run.rb +254 -0
- data/lib/uniword/wordprocessingml/run_properties.rb +701 -0
- data/lib/uniword/wordprocessingml/section_properties.rb +55 -0
- data/lib/uniword/wordprocessingml/semi_hidden.rb +27 -0
- data/lib/uniword/wordprocessingml/settings.rb +606 -0
- data/lib/uniword/wordprocessingml/shading.rb +30 -0
- data/lib/uniword/wordprocessingml/shadow.rb +24 -0
- data/lib/uniword/wordprocessingml/shape.rb +26 -0
- data/lib/uniword/wordprocessingml/simple_field.rb +27 -0
- data/lib/uniword/wordprocessingml/simple_pos.rb +24 -0
- data/lib/uniword/wordprocessingml/soft_hyphen.rb +17 -0
- data/lib/uniword/wordprocessingml/start.rb +22 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/alias.rb +21 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/appearance.rb +22 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/bibliography.rb +18 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/content.rb +32 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/data_binding.rb +27 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/date.rb +75 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/doc_part_obj.rb +57 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/end_properties.rb +24 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/id.rb +21 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/placeholder.rb +33 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/run_properties.rb +83 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/showing_placeholder_header.rb +18 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/tag.rb +21 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/temporary.rb +19 -0
- data/lib/uniword/wordprocessingml/structured_document_tag/text.rb +18 -0
- data/lib/uniword/wordprocessingml/structured_document_tag.rb +62 -0
- data/lib/uniword/wordprocessingml/structured_document_tag_properties.rb +53 -0
- data/lib/uniword/wordprocessingml/style.rb +383 -0
- data/lib/uniword/wordprocessingml/style_name.rb +45 -0
- data/lib/uniword/wordprocessingml/styles/character_style_definition.rb +45 -0
- data/lib/uniword/wordprocessingml/styles/list_style_definition.rb +74 -0
- data/lib/uniword/wordprocessingml/styles/paragraph_style_definition.rb +54 -0
- data/lib/uniword/wordprocessingml/styles/semantic_style.rb +58 -0
- data/lib/uniword/wordprocessingml/styles/style_definition.rb +61 -0
- data/lib/uniword/wordprocessingml/styles/style_library.rb +207 -0
- data/lib/uniword/wordprocessingml/styles/table_style_definition.rb +60 -0
- data/lib/uniword/wordprocessingml/styles.rb +13 -0
- data/lib/uniword/wordprocessingml/styles_configuration.rb +352 -0
- data/lib/uniword/wordprocessingml/symbol.rb +24 -0
- data/lib/uniword/wordprocessingml/tab.rb +23 -0
- data/lib/uniword/wordprocessingml/tab_stop.rb +58 -0
- data/lib/uniword/wordprocessingml/table.rb +72 -0
- data/lib/uniword/wordprocessingml/table_borders.rb +33 -0
- data/lib/uniword/wordprocessingml/table_cell.rb +80 -0
- data/lib/uniword/wordprocessingml/table_cell_borders.rb +29 -0
- data/lib/uniword/wordprocessingml/table_cell_margin.rb +29 -0
- data/lib/uniword/wordprocessingml/table_cell_properties.rb +60 -0
- data/lib/uniword/wordprocessingml/table_grid.rb +23 -0
- data/lib/uniword/wordprocessingml/table_properties.rb +352 -0
- data/lib/uniword/wordprocessingml/table_row.rb +79 -0
- data/lib/uniword/wordprocessingml/table_row_properties.rb +58 -0
- data/lib/uniword/wordprocessingml/table_style.rb +20 -0
- data/lib/uniword/wordprocessingml/text.rb +81 -0
- data/lib/uniword/wordprocessingml/text_box_content.rb +27 -0
- data/lib/uniword/wordprocessingml/text_direction.rb +19 -0
- data/lib/uniword/wordprocessingml/tr_height.rb +21 -0
- data/lib/uniword/wordprocessingml/ui_priority.rb +22 -0
- data/lib/uniword/wordprocessingml/val_int.rb +18 -0
- data/lib/uniword/wordprocessingml/w14_attributes.rb +47 -0
- data/lib/uniword/wordprocessingml/web_settings.rb +43 -0
- data/lib/uniword/wordprocessingml/width_after.rb +19 -0
- data/lib/uniword/wordprocessingml/width_before.rb +19 -0
- data/lib/uniword/wordprocessingml/zoom.rb +22 -0
- data/lib/uniword/wordprocessingml.rb +237 -0
- data/lib/uniword/wordprocessingml_2010/checkbox.rb +27 -0
- data/lib/uniword/wordprocessingml_2010/checked_state.rb +24 -0
- data/lib/uniword/wordprocessingml_2010/conditional_format_style.rb +30 -0
- data/lib/uniword/wordprocessingml_2010/conflict_deletion.rb +26 -0
- data/lib/uniword/wordprocessingml_2010/conflict_insertion.rb +26 -0
- data/lib/uniword/wordprocessingml_2010/conflict_mode.rb +22 -0
- data/lib/uniword/wordprocessingml_2010/custom_xml_conflict_insertion.rb +24 -0
- data/lib/uniword/wordprocessingml_2010/doc_id.rb +22 -0
- data/lib/uniword/wordprocessingml_2010/doc_part_gallery.rb +22 -0
- data/lib/uniword/wordprocessingml_2010/doc_part_obj.rb +27 -0
- data/lib/uniword/wordprocessingml_2010/entity_picker.rb +22 -0
- data/lib/uniword/wordprocessingml_2010/ligatures.rb +22 -0
- data/lib/uniword/wordprocessingml_2010/number_form.rb +22 -0
- data/lib/uniword/wordprocessingml_2010/para_id.rb +22 -0
- data/lib/uniword/wordprocessingml_2010/props3d.rb +26 -0
- data/lib/uniword/wordprocessingml_2010/sdt_content.rb +23 -0
- data/lib/uniword/wordprocessingml_2010/sdt_properties.rb +27 -0
- data/lib/uniword/wordprocessingml_2010/structured_document_tag.rb +25 -0
- data/lib/uniword/wordprocessingml_2010/text_fill.rb +27 -0
- data/lib/uniword/wordprocessingml_2010/text_glow.rb +25 -0
- data/lib/uniword/wordprocessingml_2010/text_id.rb +22 -0
- data/lib/uniword/wordprocessingml_2010/text_outline.rb +28 -0
- data/lib/uniword/wordprocessingml_2010/text_reflection.rb +28 -0
- data/lib/uniword/wordprocessingml_2010/text_shadow.rb +28 -0
- data/lib/uniword/wordprocessingml_2010/unchecked_state.rb +24 -0
- data/lib/uniword/wordprocessingml_2010.rb +44 -0
- data/lib/uniword/wordprocessingml_2013/chart_props.rb +25 -0
- data/lib/uniword/wordprocessingml_2013/chart_tracking_ref_based.rb +22 -0
- data/lib/uniword/wordprocessingml_2013/comment_author.rb +26 -0
- data/lib/uniword/wordprocessingml_2013/comment_collapsed.rb +22 -0
- data/lib/uniword/wordprocessingml_2013/comment_done.rb +22 -0
- data/lib/uniword/wordprocessingml_2013/comment_ex.rb +26 -0
- data/lib/uniword/wordprocessingml_2013/comments_ids.rb +23 -0
- data/lib/uniword/wordprocessingml_2013/doc_part_anchor.rb +22 -0
- data/lib/uniword/wordprocessingml_2013/document_part.rb +22 -0
- data/lib/uniword/wordprocessingml_2013/footnote_columns.rb +22 -0
- data/lib/uniword/wordprocessingml_2013/people_group.rb +25 -0
- data/lib/uniword/wordprocessingml_2013/person.rb +26 -0
- data/lib/uniword/wordprocessingml_2013/presence_info.rb +24 -0
- data/lib/uniword/wordprocessingml_2013/repeating_section.rb +25 -0
- data/lib/uniword/wordprocessingml_2013/repeating_section_item.rb +22 -0
- data/lib/uniword/wordprocessingml_2013/sdt_appearance.rb +22 -0
- data/lib/uniword/wordprocessingml_2013/sdt_color.rb +22 -0
- data/lib/uniword/wordprocessingml_2013/sdt_data_binding.rb +24 -0
- data/lib/uniword/wordprocessingml_2013/web_extension.rb +22 -0
- data/lib/uniword/wordprocessingml_2013/web_extension_linked.rb +22 -0
- data/lib/uniword/wordprocessingml_2013.rb +38 -0
- data/lib/uniword/wordprocessingml_2016/cell_rsid.rb +22 -0
- data/lib/uniword/wordprocessingml_2016/chart_color_style.rb +22 -0
- data/lib/uniword/wordprocessingml_2016/chart_style2016.rb +22 -0
- data/lib/uniword/wordprocessingml_2016/comments_ext.rb +24 -0
- data/lib/uniword/wordprocessingml_2016/conflict_mode2016.rb +22 -0
- data/lib/uniword/wordprocessingml_2016/content_id.rb +22 -0
- data/lib/uniword/wordprocessingml_2016/data_binding2016.rb +26 -0
- data/lib/uniword/wordprocessingml_2016/extension.rb +25 -0
- data/lib/uniword/wordprocessingml_2016/extension_list.rb +23 -0
- data/lib/uniword/wordprocessingml_2016/persistent_document_id.rb +22 -0
- data/lib/uniword/wordprocessingml_2016/row_rsid.rb +22 -0
- data/lib/uniword/wordprocessingml_2016/sdt_appearance2016.rb +22 -0
- data/lib/uniword/wordprocessingml_2016/separator_extension.rb +22 -0
- data/lib/uniword/wordprocessingml_2016/table_rsid.rb +22 -0
- data/lib/uniword/wordprocessingml_2016/web_video_property.rb +24 -0
- data/lib/uniword/wordprocessingml_2016.rb +33 -0
- data/lib/uniword/wp_drawing/align.rb +22 -0
- data/lib/uniword/wp_drawing/allow_overlap.rb +22 -0
- data/lib/uniword/wp_drawing/anchor.rb +80 -0
- data/lib/uniword/wp_drawing/behind_doc.rb +22 -0
- data/lib/uniword/wp_drawing/c_nv_graphic_frame_pr.rb +23 -0
- data/lib/uniword/wp_drawing/doc_pr.rb +30 -0
- data/lib/uniword/wp_drawing/doc_properties.rb +27 -0
- data/lib/uniword/wp_drawing/effect_extent.rb +28 -0
- data/lib/uniword/wp_drawing/extent.rb +24 -0
- data/lib/uniword/wp_drawing/hidden.rb +22 -0
- data/lib/uniword/wp_drawing/inline.rb +38 -0
- data/lib/uniword/wp_drawing/layout_in_cell.rb +22 -0
- data/lib/uniword/wp_drawing/line_to.rb +24 -0
- data/lib/uniword/wp_drawing/locked.rb +22 -0
- data/lib/uniword/wp_drawing/non_visual_drawing_props.rb +20 -0
- data/lib/uniword/wp_drawing/pos_offset.rb +22 -0
- data/lib/uniword/wp_drawing/position_h.rb +27 -0
- data/lib/uniword/wp_drawing/position_v.rb +27 -0
- data/lib/uniword/wp_drawing/relative_height.rb +22 -0
- data/lib/uniword/wp_drawing/simple_pos.rb +24 -0
- data/lib/uniword/wp_drawing/size_rel_h.rb +25 -0
- data/lib/uniword/wp_drawing/size_rel_v.rb +25 -0
- data/lib/uniword/wp_drawing/start.rb +24 -0
- data/lib/uniword/wp_drawing/wrap_none.rb +18 -0
- data/lib/uniword/wp_drawing/wrap_polygon.rb +27 -0
- data/lib/uniword/wp_drawing/wrap_square.rb +33 -0
- data/lib/uniword/wp_drawing/wrap_through.rb +29 -0
- data/lib/uniword/wp_drawing/wrap_tight.rb +29 -0
- data/lib/uniword/wp_drawing/wrap_top_and_bottom.rb +27 -0
- data/lib/uniword/wp_drawing.rb +55 -0
- data/lib/uniword.rb +295 -0
- metadata +1386 -0
|
@@ -0,0 +1,403 @@
|
|
|
1
|
+
# frozen_string_literal: true
|
|
2
|
+
|
|
3
|
+
# All classes autoloaded via lib/uniword/metadata.rb and lib/uniword/configuration.rb
|
|
4
|
+
|
|
5
|
+
module Uniword
|
|
6
|
+
module Metadata
|
|
7
|
+
# Extracts metadata from documents.
|
|
8
|
+
#
|
|
9
|
+
# Responsibility: Extract metadata from document structure.
|
|
10
|
+
# Single Responsibility: Only handles metadata extraction.
|
|
11
|
+
#
|
|
12
|
+
# The MetadataExtractor:
|
|
13
|
+
# - Extracts core properties (title, author, etc.)
|
|
14
|
+
# - Extracts extended properties (company, category, etc.)
|
|
15
|
+
# - Computes statistical metadata (word count, page count, etc.)
|
|
16
|
+
# - Extracts content metadata (headings, first paragraph, etc.)
|
|
17
|
+
#
|
|
18
|
+
# Does NOT handle: Validation, updating, or indexing.
|
|
19
|
+
# Those responsibilities belong to separate classes.
|
|
20
|
+
#
|
|
21
|
+
# @example Extract metadata
|
|
22
|
+
# extractor = MetadataExtractor.new
|
|
23
|
+
# metadata = extractor.extract(document)
|
|
24
|
+
# puts metadata[:word_count]
|
|
25
|
+
#
|
|
26
|
+
# @example Custom config
|
|
27
|
+
# extractor = MetadataExtractor.new(
|
|
28
|
+
# config_file: 'custom_metadata_schema'
|
|
29
|
+
# )
|
|
30
|
+
class MetadataExtractor
|
|
31
|
+
# @return [Hash] Loaded configuration
|
|
32
|
+
attr_reader :config
|
|
33
|
+
|
|
34
|
+
# Initialize a new MetadataExtractor.
|
|
35
|
+
#
|
|
36
|
+
# @param config_file [String] Path to schema configuration
|
|
37
|
+
#
|
|
38
|
+
# @example Create extractor
|
|
39
|
+
# extractor = MetadataExtractor.new
|
|
40
|
+
#
|
|
41
|
+
# @example Custom config
|
|
42
|
+
# extractor = MetadataExtractor.new(
|
|
43
|
+
# config_file: 'config/custom_schema.yml'
|
|
44
|
+
# )
|
|
45
|
+
def initialize(config_file: 'metadata_schema')
|
|
46
|
+
@config = load_configuration(config_file)
|
|
47
|
+
end
|
|
48
|
+
|
|
49
|
+
# Extract metadata from a document.
|
|
50
|
+
#
|
|
51
|
+
# @param document [Document] The document to extract from
|
|
52
|
+
# @return [Metadata] Extracted metadata
|
|
53
|
+
# @raise [ArgumentError] if document is not valid
|
|
54
|
+
#
|
|
55
|
+
# @example Extract metadata
|
|
56
|
+
# metadata = extractor.extract(document)
|
|
57
|
+
# puts metadata[:title]
|
|
58
|
+
# puts metadata[:word_count]
|
|
59
|
+
def extract(document)
|
|
60
|
+
validate_document(document)
|
|
61
|
+
|
|
62
|
+
metadata = Metadata.new
|
|
63
|
+
|
|
64
|
+
# Extract different metadata categories
|
|
65
|
+
extract_core_properties(document, metadata)
|
|
66
|
+
extract_extended_properties(document, metadata)
|
|
67
|
+
extract_statistical_metadata(document, metadata) if extraction_enabled?(:statistics)
|
|
68
|
+
extract_content_metadata(document, metadata) if extraction_enabled?(:content)
|
|
69
|
+
|
|
70
|
+
metadata
|
|
71
|
+
end
|
|
72
|
+
|
|
73
|
+
private
|
|
74
|
+
|
|
75
|
+
# Load configuration from file.
|
|
76
|
+
#
|
|
77
|
+
# @param config_file [String] Configuration file name or path
|
|
78
|
+
# @return [Hash] Loaded configuration
|
|
79
|
+
def load_configuration(config_file)
|
|
80
|
+
if File.exist?(config_file)
|
|
81
|
+
Configuration::ConfigurationLoader.load_file(config_file)
|
|
82
|
+
else
|
|
83
|
+
Configuration::ConfigurationLoader.load(config_file)
|
|
84
|
+
end
|
|
85
|
+
rescue Configuration::ConfigurationError => e
|
|
86
|
+
warn "Warning: #{e.message}. Using default configuration."
|
|
87
|
+
default_configuration
|
|
88
|
+
end
|
|
89
|
+
|
|
90
|
+
# Get default configuration.
|
|
91
|
+
#
|
|
92
|
+
# @return [Hash] Default configuration
|
|
93
|
+
def default_configuration
|
|
94
|
+
{
|
|
95
|
+
extraction_config: {
|
|
96
|
+
statistics: { enabled: true },
|
|
97
|
+
content: { enabled: true }
|
|
98
|
+
}
|
|
99
|
+
}
|
|
100
|
+
end
|
|
101
|
+
|
|
102
|
+
# Validate document.
|
|
103
|
+
#
|
|
104
|
+
# @param document [Object] The document to validate
|
|
105
|
+
# @raise [ArgumentError] if document is invalid
|
|
106
|
+
def validate_document(document)
|
|
107
|
+
return if document.respond_to?(:paragraphs)
|
|
108
|
+
|
|
109
|
+
raise ArgumentError,
|
|
110
|
+
"Document must respond to :paragraphs, got #{document.class}"
|
|
111
|
+
end
|
|
112
|
+
|
|
113
|
+
# Check if extraction is enabled for a category.
|
|
114
|
+
#
|
|
115
|
+
# @param category [Symbol] Category name (:statistics, :content)
|
|
116
|
+
# @return [Boolean] true if enabled
|
|
117
|
+
def extraction_enabled?(category)
|
|
118
|
+
extraction_config = @config[:extraction_config]
|
|
119
|
+
return true unless extraction_config
|
|
120
|
+
|
|
121
|
+
category_config = extraction_config[category]
|
|
122
|
+
return true unless category_config
|
|
123
|
+
|
|
124
|
+
category_config.fetch(:enabled, true)
|
|
125
|
+
end
|
|
126
|
+
|
|
127
|
+
# Extract core properties from document.
|
|
128
|
+
#
|
|
129
|
+
# Core properties include: title, author, subject, keywords, etc.
|
|
130
|
+
#
|
|
131
|
+
# @param document [Document] The document
|
|
132
|
+
# @param metadata [Metadata] Metadata to populate
|
|
133
|
+
def extract_core_properties(document, metadata)
|
|
134
|
+
# Extract from document's core_properties
|
|
135
|
+
props = document.core_properties
|
|
136
|
+
return unless props
|
|
137
|
+
|
|
138
|
+
# Use method access for CoreProperties object
|
|
139
|
+
metadata[:title] = props.title if props.title
|
|
140
|
+
metadata[:subject] = props.subject if props.subject
|
|
141
|
+
metadata[:keywords] = props.keywords if props.keywords
|
|
142
|
+
metadata[:description] = props.description if props.description
|
|
143
|
+
metadata[:creator] = props.creator if props.creator
|
|
144
|
+
metadata[:created_at] = props.created&.value if props.created&.value
|
|
145
|
+
metadata[:modified_at] = props.modified&.value if props.modified&.value
|
|
146
|
+
metadata[:last_modified_by] = props.last_modified_by if props.last_modified_by
|
|
147
|
+
|
|
148
|
+
# If title not found, try to extract from first heading
|
|
149
|
+
metadata[:title] ||= extract_title_from_content(document)
|
|
150
|
+
end
|
|
151
|
+
|
|
152
|
+
# Extract extended properties from document.
|
|
153
|
+
#
|
|
154
|
+
# Extended properties include: company, category, manager, etc.
|
|
155
|
+
#
|
|
156
|
+
# @param document [Document] The document
|
|
157
|
+
# @param metadata [Metadata] Metadata to populate
|
|
158
|
+
def extract_extended_properties(document, metadata)
|
|
159
|
+
return unless document.respond_to?(:extended_properties)
|
|
160
|
+
|
|
161
|
+
props = document.extended_properties
|
|
162
|
+
return unless props
|
|
163
|
+
|
|
164
|
+
metadata[:company] = props[:company] if props[:company]
|
|
165
|
+
metadata[:category] = props[:category] if props[:category]
|
|
166
|
+
metadata[:manager] = props[:manager] if props[:manager]
|
|
167
|
+
metadata[:language] = props[:language] if props[:language]
|
|
168
|
+
metadata[:version] = props[:version] if props[:version]
|
|
169
|
+
metadata[:revision] = props[:revision] if props[:revision]
|
|
170
|
+
metadata[:status] = props[:status] if props[:status]
|
|
171
|
+
end
|
|
172
|
+
|
|
173
|
+
# Extract statistical metadata from document.
|
|
174
|
+
#
|
|
175
|
+
# Statistical metadata includes: word count, page count, etc.
|
|
176
|
+
#
|
|
177
|
+
# @param document [Document] The document
|
|
178
|
+
# @param metadata [Metadata] Metadata to populate
|
|
179
|
+
def extract_statistical_metadata(document, metadata)
|
|
180
|
+
stats_config = @config.dig(:extraction_config, :statistics) || {}
|
|
181
|
+
|
|
182
|
+
# Word count
|
|
183
|
+
metadata[:word_count] = compute_word_count(document) if stats_config.fetch(
|
|
184
|
+
:compute_word_count, true
|
|
185
|
+
)
|
|
186
|
+
|
|
187
|
+
# Character count
|
|
188
|
+
metadata[:character_count] = compute_character_count(document) if stats_config.fetch(
|
|
189
|
+
:compute_character_count, true
|
|
190
|
+
)
|
|
191
|
+
|
|
192
|
+
# Paragraph count
|
|
193
|
+
metadata[:paragraph_count] = document.paragraphs.size
|
|
194
|
+
|
|
195
|
+
# Page count estimate
|
|
196
|
+
if stats_config.fetch(:compute_page_estimate, true)
|
|
197
|
+
words_per_page = stats_config.fetch(:page_estimate_words_per_page, 500)
|
|
198
|
+
metadata[:page_count] = estimate_page_count(
|
|
199
|
+
metadata[:word_count] || 0,
|
|
200
|
+
words_per_page
|
|
201
|
+
)
|
|
202
|
+
end
|
|
203
|
+
|
|
204
|
+
# Table count
|
|
205
|
+
metadata[:table_count] = document.tables.size if document.respond_to?(:tables)
|
|
206
|
+
|
|
207
|
+
# Image count
|
|
208
|
+
metadata[:image_count] = document.images.size if document.respond_to?(:images)
|
|
209
|
+
|
|
210
|
+
# Hyperlink count
|
|
211
|
+
metadata[:hyperlink_count] = document.hyperlinks.size if document.respond_to?(:hyperlinks)
|
|
212
|
+
|
|
213
|
+
# Footnote count
|
|
214
|
+
if document.respond_to?(:footnotes)
|
|
215
|
+
footnotes = document.footnotes
|
|
216
|
+
metadata[:footnote_count] = case footnotes
|
|
217
|
+
when Array
|
|
218
|
+
footnotes.size
|
|
219
|
+
when Hash
|
|
220
|
+
footnotes.size
|
|
221
|
+
else
|
|
222
|
+
0
|
|
223
|
+
end
|
|
224
|
+
end
|
|
225
|
+
|
|
226
|
+
# Endnote count
|
|
227
|
+
return unless document.respond_to?(:endnotes)
|
|
228
|
+
|
|
229
|
+
endnotes = document.endnotes
|
|
230
|
+
metadata[:endnote_count] = case endnotes
|
|
231
|
+
when Array
|
|
232
|
+
endnotes.size
|
|
233
|
+
when Hash
|
|
234
|
+
endnotes.size
|
|
235
|
+
else
|
|
236
|
+
0
|
|
237
|
+
end
|
|
238
|
+
end
|
|
239
|
+
|
|
240
|
+
# Extract content metadata from document.
|
|
241
|
+
#
|
|
242
|
+
# Content metadata includes: headings, first paragraph, etc.
|
|
243
|
+
#
|
|
244
|
+
# @param document [Document] The document
|
|
245
|
+
# @param metadata [Metadata] Metadata to populate
|
|
246
|
+
def extract_content_metadata(document, metadata)
|
|
247
|
+
content_config = @config.dig(:extraction_config, :content) || {}
|
|
248
|
+
|
|
249
|
+
# Extract headings
|
|
250
|
+
if content_config.fetch(:extract_headings, true)
|
|
251
|
+
metadata[:headings] = extract_headings(
|
|
252
|
+
document,
|
|
253
|
+
max_levels: content_config.fetch(:max_heading_levels, 6)
|
|
254
|
+
)
|
|
255
|
+
end
|
|
256
|
+
|
|
257
|
+
# Extract first paragraph
|
|
258
|
+
return unless content_config.fetch(:extract_first_paragraph, true)
|
|
259
|
+
|
|
260
|
+
metadata[:first_paragraph] = extract_first_paragraph(
|
|
261
|
+
document,
|
|
262
|
+
max_length: content_config.fetch(:first_paragraph_max_length, 500)
|
|
263
|
+
)
|
|
264
|
+
end
|
|
265
|
+
|
|
266
|
+
# Extract title from document content.
|
|
267
|
+
#
|
|
268
|
+
# Looks for first heading or first paragraph.
|
|
269
|
+
#
|
|
270
|
+
# @param document [Document] The document
|
|
271
|
+
# @return [String, nil] Extracted title
|
|
272
|
+
def extract_title_from_content(document)
|
|
273
|
+
return nil if document.paragraphs.empty?
|
|
274
|
+
|
|
275
|
+
# Look for first heading-styled paragraph
|
|
276
|
+
first_heading = document.paragraphs.find do |para|
|
|
277
|
+
next false unless para.respond_to?(:style)
|
|
278
|
+
|
|
279
|
+
style = para.style
|
|
280
|
+
style && (style.include?('Heading') || style.include?('heading'))
|
|
281
|
+
end
|
|
282
|
+
|
|
283
|
+
if first_heading
|
|
284
|
+
first_heading.respond_to?(:text) ? first_heading.text : nil
|
|
285
|
+
else
|
|
286
|
+
# Use first paragraph if no heading found
|
|
287
|
+
first_para = document.paragraphs.first
|
|
288
|
+
text = first_para.respond_to?(:text) ? first_para.text : nil
|
|
289
|
+
text && text.length <= 100 ? text : nil
|
|
290
|
+
end
|
|
291
|
+
end
|
|
292
|
+
|
|
293
|
+
# Compute word count for document.
|
|
294
|
+
#
|
|
295
|
+
# @param document [Document] The document
|
|
296
|
+
# @return [Integer] Word count
|
|
297
|
+
def compute_word_count(document)
|
|
298
|
+
text = document.respond_to?(:text) ? document.text : ''
|
|
299
|
+
return 0 if text.nil? || text.empty?
|
|
300
|
+
|
|
301
|
+
# Split by whitespace and count non-empty words
|
|
302
|
+
text.split(/\s+/).reject(&:empty?).size
|
|
303
|
+
end
|
|
304
|
+
|
|
305
|
+
# Compute character count for document.
|
|
306
|
+
#
|
|
307
|
+
# @param document [Document] The document
|
|
308
|
+
# @return [Integer] Character count
|
|
309
|
+
def compute_character_count(document)
|
|
310
|
+
text = document.respond_to?(:text) ? document.text : ''
|
|
311
|
+
return 0 if text.nil?
|
|
312
|
+
|
|
313
|
+
text.length
|
|
314
|
+
end
|
|
315
|
+
|
|
316
|
+
# Estimate page count from word count.
|
|
317
|
+
#
|
|
318
|
+
# @param word_count [Integer] Total word count
|
|
319
|
+
# @param words_per_page [Integer] Estimated words per page
|
|
320
|
+
# @return [Integer] Estimated page count
|
|
321
|
+
def estimate_page_count(word_count, words_per_page)
|
|
322
|
+
return 0 if word_count.zero?
|
|
323
|
+
|
|
324
|
+
(word_count.to_f / words_per_page).ceil.to_i
|
|
325
|
+
end
|
|
326
|
+
|
|
327
|
+
# Extract headings from document.
|
|
328
|
+
#
|
|
329
|
+
# @param document [Document] The document
|
|
330
|
+
# @param max_levels [Integer] Maximum heading levels to extract
|
|
331
|
+
# @return [Array<Hash>] Array of heading data
|
|
332
|
+
def extract_headings(document, max_levels: 6)
|
|
333
|
+
headings = []
|
|
334
|
+
|
|
335
|
+
document.paragraphs.each_with_index do |para, index|
|
|
336
|
+
next unless para.respond_to?(:style)
|
|
337
|
+
|
|
338
|
+
style = para.style
|
|
339
|
+
next unless style
|
|
340
|
+
|
|
341
|
+
# Check if it's a heading style
|
|
342
|
+
level = extract_heading_level(style)
|
|
343
|
+
next unless level && level <= max_levels
|
|
344
|
+
|
|
345
|
+
text = para.respond_to?(:text) ? para.text : ''
|
|
346
|
+
next if text.empty?
|
|
347
|
+
|
|
348
|
+
headings << {
|
|
349
|
+
level: level,
|
|
350
|
+
text: text,
|
|
351
|
+
position: index
|
|
352
|
+
}
|
|
353
|
+
end
|
|
354
|
+
|
|
355
|
+
headings
|
|
356
|
+
end
|
|
357
|
+
|
|
358
|
+
# Extract heading level from style name.
|
|
359
|
+
#
|
|
360
|
+
# @param style [String] Style name
|
|
361
|
+
# @return [Integer, nil] Heading level (1-9) or nil
|
|
362
|
+
def extract_heading_level(style)
|
|
363
|
+
return nil unless style
|
|
364
|
+
|
|
365
|
+
# Match "Heading 1", "Heading1", "heading 1", etc.
|
|
366
|
+
match = style.match(/heading\s*(\d)/i)
|
|
367
|
+
return nil unless match
|
|
368
|
+
|
|
369
|
+
match[1].to_i
|
|
370
|
+
end
|
|
371
|
+
|
|
372
|
+
# Extract first paragraph text.
|
|
373
|
+
#
|
|
374
|
+
# @param document [Document] The document
|
|
375
|
+
# @param max_length [Integer] Maximum text length
|
|
376
|
+
# @return [String, nil] First paragraph text
|
|
377
|
+
def extract_first_paragraph(document, max_length: 500)
|
|
378
|
+
return nil if document.paragraphs.empty?
|
|
379
|
+
|
|
380
|
+
# Find first non-empty paragraph that's not a heading
|
|
381
|
+
first_para = document.paragraphs.find do |para|
|
|
382
|
+
next false unless para.respond_to?(:text)
|
|
383
|
+
|
|
384
|
+
text = para.text
|
|
385
|
+
next false if text.nil? || text.strip.empty?
|
|
386
|
+
|
|
387
|
+
# Skip if it's a heading
|
|
388
|
+
if para.respond_to?(:style)
|
|
389
|
+
style = para.style
|
|
390
|
+
next false if style && (style.include?('Heading') || style.include?('heading'))
|
|
391
|
+
end
|
|
392
|
+
|
|
393
|
+
true
|
|
394
|
+
end
|
|
395
|
+
|
|
396
|
+
return nil unless first_para
|
|
397
|
+
|
|
398
|
+
text = first_para.text.strip
|
|
399
|
+
text.length > max_length ? "#{text[0...max_length]}..." : text
|
|
400
|
+
end
|
|
401
|
+
end
|
|
402
|
+
end
|
|
403
|
+
end
|