PyPI - machine-dialect - Versions diffs - 0.1.0a1__py3-none-any.whl - Mend

machine-dialect 0.1.0a1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (268) hide show

machine_dialect/__main__.py +667 -0
machine_dialect/agent/__init__.py +5 -0
machine_dialect/agent/agent.py +360 -0
machine_dialect/ast/__init__.py +95 -0
machine_dialect/ast/ast_node.py +35 -0
machine_dialect/ast/call_expression.py +82 -0
machine_dialect/ast/dict_extraction.py +60 -0
machine_dialect/ast/expressions.py +439 -0
machine_dialect/ast/literals.py +309 -0
machine_dialect/ast/program.py +35 -0
machine_dialect/ast/statements.py +1433 -0
machine_dialect/ast/tests/test_ast_string_representation.py +62 -0
machine_dialect/ast/tests/test_boolean_literal.py +29 -0
machine_dialect/ast/tests/test_collection_hir.py +138 -0
machine_dialect/ast/tests/test_define_statement.py +142 -0
machine_dialect/ast/tests/test_desugar.py +541 -0
machine_dialect/ast/tests/test_foreach_desugar.py +245 -0
machine_dialect/cfg/__init__.py +6 -0
machine_dialect/cfg/config.py +156 -0
machine_dialect/cfg/examples.py +221 -0
machine_dialect/cfg/generate_with_ai.py +187 -0
machine_dialect/cfg/openai_generation.py +200 -0
machine_dialect/cfg/parser.py +94 -0
machine_dialect/cfg/tests/__init__.py +1 -0
machine_dialect/cfg/tests/test_cfg_parser.py +252 -0
machine_dialect/cfg/tests/test_config.py +188 -0
machine_dialect/cfg/tests/test_examples.py +391 -0
machine_dialect/cfg/tests/test_generate_with_ai.py +354 -0
machine_dialect/cfg/tests/test_openai_generation.py +256 -0
machine_dialect/codegen/__init__.py +5 -0
machine_dialect/codegen/bytecode_module.py +89 -0
machine_dialect/codegen/bytecode_serializer.py +300 -0
machine_dialect/codegen/opcodes.py +101 -0
machine_dialect/codegen/register_codegen.py +1996 -0
machine_dialect/codegen/symtab.py +208 -0
machine_dialect/codegen/tests/__init__.py +1 -0
machine_dialect/codegen/tests/test_array_operations_codegen.py +295 -0
machine_dialect/codegen/tests/test_bytecode_serializer.py +185 -0
machine_dialect/codegen/tests/test_register_codegen_ssa.py +324 -0
machine_dialect/codegen/tests/test_symtab.py +418 -0
machine_dialect/codegen/vm_serializer.py +621 -0
machine_dialect/compiler/__init__.py +18 -0
machine_dialect/compiler/compiler.py +197 -0
machine_dialect/compiler/config.py +149 -0
machine_dialect/compiler/context.py +149 -0
machine_dialect/compiler/phases/__init__.py +19 -0
machine_dialect/compiler/phases/bytecode_optimization.py +90 -0
machine_dialect/compiler/phases/codegen.py +40 -0
machine_dialect/compiler/phases/hir_generation.py +39 -0
machine_dialect/compiler/phases/mir_generation.py +86 -0
machine_dialect/compiler/phases/optimization.py +110 -0
machine_dialect/compiler/phases/parsing.py +39 -0
machine_dialect/compiler/pipeline.py +143 -0
machine_dialect/compiler/tests/__init__.py +1 -0
machine_dialect/compiler/tests/test_compiler.py +568 -0
machine_dialect/compiler/vm_runner.py +173 -0
machine_dialect/errors/__init__.py +32 -0
machine_dialect/errors/exceptions.py +369 -0
machine_dialect/errors/messages.py +82 -0
machine_dialect/errors/tests/__init__.py +0 -0
machine_dialect/errors/tests/test_expected_token_errors.py +188 -0
machine_dialect/errors/tests/test_name_errors.py +118 -0
machine_dialect/helpers/__init__.py +0 -0
machine_dialect/helpers/stopwords.py +225 -0
machine_dialect/helpers/validators.py +30 -0
machine_dialect/lexer/__init__.py +9 -0
machine_dialect/lexer/constants.py +23 -0
machine_dialect/lexer/lexer.py +907 -0
machine_dialect/lexer/tests/__init__.py +0 -0
machine_dialect/lexer/tests/helpers.py +86 -0
machine_dialect/lexer/tests/test_apostrophe_identifiers.py +122 -0
machine_dialect/lexer/tests/test_backtick_identifiers.py +140 -0
machine_dialect/lexer/tests/test_boolean_literals.py +108 -0
machine_dialect/lexer/tests/test_case_insensitive_keywords.py +188 -0
machine_dialect/lexer/tests/test_comments.py +200 -0
machine_dialect/lexer/tests/test_double_asterisk_keywords.py +127 -0
machine_dialect/lexer/tests/test_lexer_position.py +113 -0
machine_dialect/lexer/tests/test_list_tokens.py +282 -0
machine_dialect/lexer/tests/test_stopwords.py +80 -0
machine_dialect/lexer/tests/test_strict_equality.py +129 -0
machine_dialect/lexer/tests/test_token.py +41 -0
machine_dialect/lexer/tests/test_tokenization.py +294 -0
machine_dialect/lexer/tests/test_underscore_literals.py +343 -0
machine_dialect/lexer/tests/test_url_literals.py +169 -0
machine_dialect/lexer/tokens.py +487 -0
machine_dialect/linter/__init__.py +10 -0
machine_dialect/linter/__main__.py +144 -0
machine_dialect/linter/linter.py +154 -0
machine_dialect/linter/rules/__init__.py +8 -0
machine_dialect/linter/rules/base.py +112 -0
machine_dialect/linter/rules/statement_termination.py +99 -0
machine_dialect/linter/tests/__init__.py +1 -0
machine_dialect/linter/tests/mdrules/__init__.py +0 -0
machine_dialect/linter/tests/mdrules/test_md101_statement_termination.py +181 -0
machine_dialect/linter/tests/test_linter.py +81 -0
machine_dialect/linter/tests/test_rules.py +110 -0
machine_dialect/linter/tests/test_violations.py +71 -0
machine_dialect/linter/violations.py +51 -0
machine_dialect/mir/__init__.py +69 -0
machine_dialect/mir/analyses/__init__.py +20 -0
machine_dialect/mir/analyses/alias_analysis.py +315 -0
machine_dialect/mir/analyses/dominance_analysis.py +49 -0
machine_dialect/mir/analyses/escape_analysis.py +286 -0
machine_dialect/mir/analyses/loop_analysis.py +272 -0
machine_dialect/mir/analyses/tests/test_type_analysis.py +736 -0
machine_dialect/mir/analyses/type_analysis.py +448 -0
machine_dialect/mir/analyses/use_def_chains.py +232 -0
machine_dialect/mir/basic_block.py +385 -0
machine_dialect/mir/dataflow.py +445 -0
machine_dialect/mir/debug_info.py +208 -0
machine_dialect/mir/hir_to_mir.py +1738 -0
machine_dialect/mir/mir_dumper.py +366 -0
machine_dialect/mir/mir_function.py +167 -0
machine_dialect/mir/mir_instructions.py +1877 -0
machine_dialect/mir/mir_interpreter.py +556 -0
machine_dialect/mir/mir_module.py +225 -0
machine_dialect/mir/mir_printer.py +480 -0
machine_dialect/mir/mir_transformer.py +410 -0
machine_dialect/mir/mir_types.py +367 -0
machine_dialect/mir/mir_validation.py +455 -0
machine_dialect/mir/mir_values.py +268 -0
machine_dialect/mir/optimization_config.py +233 -0
machine_dialect/mir/optimization_pass.py +251 -0
machine_dialect/mir/optimization_pipeline.py +355 -0
machine_dialect/mir/optimizations/__init__.py +84 -0
machine_dialect/mir/optimizations/algebraic_simplification.py +733 -0
machine_dialect/mir/optimizations/branch_prediction.py +372 -0
machine_dialect/mir/optimizations/constant_propagation.py +634 -0
machine_dialect/mir/optimizations/cse.py +398 -0
machine_dialect/mir/optimizations/dce.py +288 -0
machine_dialect/mir/optimizations/inlining.py +551 -0
machine_dialect/mir/optimizations/jump_threading.py +487 -0
machine_dialect/mir/optimizations/licm.py +405 -0
machine_dialect/mir/optimizations/loop_unrolling.py +366 -0
machine_dialect/mir/optimizations/strength_reduction.py +422 -0
machine_dialect/mir/optimizations/tail_call.py +207 -0
machine_dialect/mir/optimizations/tests/test_loop_unrolling.py +483 -0
machine_dialect/mir/optimizations/type_narrowing.py +397 -0
machine_dialect/mir/optimizations/type_specialization.py +447 -0
machine_dialect/mir/optimizations/type_specific.py +906 -0
machine_dialect/mir/optimize_mir.py +89 -0
machine_dialect/mir/pass_manager.py +391 -0
machine_dialect/mir/profiling/__init__.py +26 -0
machine_dialect/mir/profiling/profile_collector.py +318 -0
machine_dialect/mir/profiling/profile_data.py +372 -0
machine_dialect/mir/profiling/profile_reader.py +272 -0
machine_dialect/mir/profiling/profile_writer.py +226 -0
machine_dialect/mir/register_allocation.py +302 -0
machine_dialect/mir/reporting/__init__.py +17 -0
machine_dialect/mir/reporting/optimization_reporter.py +314 -0
machine_dialect/mir/reporting/report_formatter.py +289 -0
machine_dialect/mir/ssa_construction.py +342 -0
machine_dialect/mir/tests/__init__.py +1 -0
machine_dialect/mir/tests/test_algebraic_associativity.py +204 -0
machine_dialect/mir/tests/test_algebraic_complex_patterns.py +221 -0
machine_dialect/mir/tests/test_algebraic_division.py +126 -0
machine_dialect/mir/tests/test_algebraic_simplification.py +863 -0
machine_dialect/mir/tests/test_basic_block.py +425 -0
machine_dialect/mir/tests/test_branch_prediction.py +459 -0
machine_dialect/mir/tests/test_call_lowering.py +168 -0
machine_dialect/mir/tests/test_collection_lowering.py +604 -0
machine_dialect/mir/tests/test_cross_block_constant_propagation.py +255 -0
machine_dialect/mir/tests/test_custom_passes.py +166 -0
machine_dialect/mir/tests/test_debug_info.py +285 -0
machine_dialect/mir/tests/test_dict_extraction_lowering.py +192 -0
machine_dialect/mir/tests/test_dictionary_lowering.py +299 -0
machine_dialect/mir/tests/test_double_negation.py +231 -0
machine_dialect/mir/tests/test_escape_analysis.py +233 -0
machine_dialect/mir/tests/test_hir_to_mir.py +465 -0
machine_dialect/mir/tests/test_hir_to_mir_complete.py +389 -0
machine_dialect/mir/tests/test_hir_to_mir_simple.py +130 -0
machine_dialect/mir/tests/test_inlining.py +435 -0
machine_dialect/mir/tests/test_licm.py +472 -0
machine_dialect/mir/tests/test_mir_dumper.py +313 -0
machine_dialect/mir/tests/test_mir_instructions.py +445 -0
machine_dialect/mir/tests/test_mir_module.py +860 -0
machine_dialect/mir/tests/test_mir_printer.py +387 -0
machine_dialect/mir/tests/test_mir_types.py +123 -0
machine_dialect/mir/tests/test_mir_types_enhanced.py +132 -0
machine_dialect/mir/tests/test_mir_validation.py +378 -0
machine_dialect/mir/tests/test_mir_values.py +168 -0
machine_dialect/mir/tests/test_one_based_indexing.py +202 -0
machine_dialect/mir/tests/test_optimization_helpers.py +60 -0
machine_dialect/mir/tests/test_optimization_pipeline.py +554 -0
machine_dialect/mir/tests/test_optimization_reporter.py +318 -0
machine_dialect/mir/tests/test_pass_manager.py +294 -0
machine_dialect/mir/tests/test_pass_registration.py +64 -0
machine_dialect/mir/tests/test_profiling.py +356 -0
machine_dialect/mir/tests/test_register_allocation.py +307 -0
machine_dialect/mir/tests/test_report_formatters.py +372 -0
machine_dialect/mir/tests/test_ssa_construction.py +433 -0
machine_dialect/mir/tests/test_tail_call.py +236 -0
machine_dialect/mir/tests/test_type_annotated_instructions.py +192 -0
machine_dialect/mir/tests/test_type_narrowing.py +277 -0
machine_dialect/mir/tests/test_type_specialization.py +421 -0
machine_dialect/mir/tests/test_type_specific_optimization.py +545 -0
machine_dialect/mir/tests/test_type_specific_optimization_advanced.py +382 -0
machine_dialect/mir/type_inference.py +368 -0
machine_dialect/parser/__init__.py +12 -0
machine_dialect/parser/enums.py +45 -0
machine_dialect/parser/parser.py +3655 -0
machine_dialect/parser/protocols.py +11 -0
machine_dialect/parser/symbol_table.py +169 -0
machine_dialect/parser/tests/__init__.py +0 -0
machine_dialect/parser/tests/helper_functions.py +193 -0
machine_dialect/parser/tests/test_action_statements.py +334 -0
machine_dialect/parser/tests/test_boolean_literal_expressions.py +152 -0
machine_dialect/parser/tests/test_call_statements.py +154 -0
machine_dialect/parser/tests/test_call_statements_errors.py +187 -0
machine_dialect/parser/tests/test_collection_mutations.py +264 -0
machine_dialect/parser/tests/test_conditional_expressions.py +343 -0
machine_dialect/parser/tests/test_define_integration.py +468 -0
machine_dialect/parser/tests/test_define_statements.py +311 -0
machine_dialect/parser/tests/test_dict_extraction.py +115 -0
machine_dialect/parser/tests/test_empty_literal.py +155 -0
machine_dialect/parser/tests/test_float_literal_expressions.py +163 -0
machine_dialect/parser/tests/test_identifier_expressions.py +57 -0
machine_dialect/parser/tests/test_if_empty_block.py +61 -0
machine_dialect/parser/tests/test_if_statements.py +299 -0
machine_dialect/parser/tests/test_illegal_tokens.py +86 -0
machine_dialect/parser/tests/test_infix_expressions.py +680 -0
machine_dialect/parser/tests/test_integer_literal_expressions.py +137 -0
machine_dialect/parser/tests/test_interaction_statements.py +269 -0
machine_dialect/parser/tests/test_list_literals.py +277 -0
machine_dialect/parser/tests/test_no_none_in_ast.py +94 -0
machine_dialect/parser/tests/test_panic_mode_recovery.py +171 -0
machine_dialect/parser/tests/test_parse_errors.py +114 -0
machine_dialect/parser/tests/test_possessive_syntax.py +182 -0
machine_dialect/parser/tests/test_prefix_expressions.py +415 -0
machine_dialect/parser/tests/test_program.py +13 -0
machine_dialect/parser/tests/test_return_statements.py +89 -0
machine_dialect/parser/tests/test_set_statements.py +152 -0
machine_dialect/parser/tests/test_strict_equality.py +258 -0
machine_dialect/parser/tests/test_symbol_table.py +217 -0
machine_dialect/parser/tests/test_url_literal_expressions.py +209 -0
machine_dialect/parser/tests/test_utility_statements.py +423 -0
machine_dialect/parser/token_buffer.py +159 -0
machine_dialect/repl/__init__.py +3 -0
machine_dialect/repl/repl.py +426 -0
machine_dialect/repl/tests/__init__.py +0 -0
machine_dialect/repl/tests/test_repl.py +606 -0
machine_dialect/semantic/__init__.py +12 -0
machine_dialect/semantic/analyzer.py +906 -0
machine_dialect/semantic/error_messages.py +189 -0
machine_dialect/semantic/tests/__init__.py +1 -0
machine_dialect/semantic/tests/test_analyzer.py +364 -0
machine_dialect/semantic/tests/test_error_messages.py +104 -0
machine_dialect/tests/edge_cases/__init__.py +10 -0
machine_dialect/tests/edge_cases/test_boundary_access.py +256 -0
machine_dialect/tests/edge_cases/test_empty_collections.py +166 -0
machine_dialect/tests/edge_cases/test_invalid_operations.py +243 -0
machine_dialect/tests/edge_cases/test_named_list_edge_cases.py +295 -0
machine_dialect/tests/edge_cases/test_nested_structures.py +313 -0
machine_dialect/tests/edge_cases/test_type_mixing.py +277 -0
machine_dialect/tests/integration/test_array_operations_emulation.py +248 -0
machine_dialect/tests/integration/test_list_compilation.py +395 -0
machine_dialect/tests/integration/test_lists_and_dictionaries.py +322 -0
machine_dialect/type_checking/__init__.py +21 -0
machine_dialect/type_checking/tests/__init__.py +1 -0
machine_dialect/type_checking/tests/test_type_system.py +230 -0
machine_dialect/type_checking/type_system.py +270 -0
machine_dialect-0.1.0a1.dist-info/METADATA +128 -0
machine_dialect-0.1.0a1.dist-info/RECORD +268 -0
machine_dialect-0.1.0a1.dist-info/WHEEL +5 -0
machine_dialect-0.1.0a1.dist-info/entry_points.txt +3 -0
machine_dialect-0.1.0a1.dist-info/licenses/LICENSE +201 -0
machine_dialect-0.1.0a1.dist-info/top_level.txt +2 -0
machine_dialect_vm/__init__.pyi +15 -0

machine_dialect/mir/profiling/profile_reader.py ADDED Viewed

@@ -0,0 +1,272 @@
+"""Profile reader for loading persisted profile data.
+This module implements deserialization of profile data from disk
+for use in profile-guided optimization.
+"""
+import json
+from pathlib import Path
+from typing import Any
+from machine_dialect.mir.profiling.profile_data import (
+    BasicBlockProfile,
+    BranchProfile,
+    FunctionProfile,
+    IndirectCallProfile,
+    LoopProfile,
+    ProfileData,
+)
+class ProfileReader:
+    """Reads profile data from disk in various formats."""
+    def __init__(self) -> None:
+        """Initialize the profile reader."""
+        pass
+    def read_json(self, filepath: Path | str) -> ProfileData:
+        """Read profile data from JSON format.
+        Args:
+            filepath: Path to input file.
+        Returns:
+            Loaded profile data.
+        Raises:
+            FileNotFoundError: If file doesn't exist.
+            json.JSONDecodeError: If file is not valid JSON.
+        """
+        filepath = Path(filepath)
+        if not filepath.exists():
+            raise FileNotFoundError(f"Profile file not found: {filepath}")
+        with open(filepath) as f:
+            data = json.load(f)
+        return self._dict_to_profile(data)
+    def read_binary(self, filepath: Path | str) -> ProfileData:
+        """Read profile data from binary format.
+        Args:
+            filepath: Path to input file.
+        Returns:
+            Loaded profile data.
+        Raises:
+            FileNotFoundError: If file doesn't exist.
+            pickle.UnpicklingError: If file is not valid pickle format.
+        """
+        import pickle
+        filepath = Path(filepath)
+        if not filepath.exists():
+            raise FileNotFoundError(f"Profile file not found: {filepath}")
+        with open(filepath, "rb") as f:
+            data = pickle.load(f)
+            if not isinstance(data, ProfileData):
+                raise ValueError(f"Invalid profile data type: {type(data)}")
+            return data
+    def read_auto(self, filepath: Path | str) -> ProfileData:
+        """Automatically detect format and read profile data.
+        Args:
+            filepath: Path to input file.
+        Returns:
+            Loaded profile data.
+        Raises:
+            FileNotFoundError: If file doesn't exist.
+            ValueError: If format cannot be determined.
+        """
+        filepath = Path(filepath)
+        if not filepath.exists():
+            raise FileNotFoundError(f"Profile file not found: {filepath}")
+        # Try to detect format by extension
+        if filepath.suffix == ".json":
+            return self.read_json(filepath)
+        elif filepath.suffix in [".pkl", ".pickle", ".bin"]:
+            return self.read_binary(filepath)
+        # Try to detect by content
+        try:
+            return self.read_json(filepath)
+        except json.JSONDecodeError:
+            try:
+                return self.read_binary(filepath)
+            except Exception as e:
+                raise ValueError(f"Cannot determine profile format: {e}") from e
+    def merge_profiles(self, filepaths: list[Path | str]) -> ProfileData:
+        """Merge multiple profile files into one.
+        Args:
+            filepaths: List of profile file paths.
+        Returns:
+            Merged profile data.
+        """
+        if not filepaths:
+            raise ValueError("No profile files provided")
+        # Read first profile as base
+        merged = self.read_auto(filepaths[0])
+        # Merge remaining profiles
+        for filepath in filepaths[1:]:
+            profile = self.read_auto(filepath)
+            merged.merge(profile)
+        return merged
+    def _dict_to_profile(self, data: dict[str, Any]) -> ProfileData:
+        """Convert dictionary to profile data.
+        Args:
+            data: Dictionary representation.
+        Returns:
+            Profile data object.
+        """
+        profile = ProfileData(
+            module_name=data.get("module_name", "default"),
+            total_samples=data.get("total_samples", 0),
+            metadata=data.get("metadata", {}),
+        )
+        # Load functions
+        for name, func_data in data.get("functions", {}).items():
+            profile.functions[name] = self._dict_to_function(func_data)
+        # Load branches
+        for loc, branch_data in data.get("branches", {}).items():
+            profile.branches[loc] = self._dict_to_branch(branch_data)
+        # Load loops
+        for loc, loop_data in data.get("loops", {}).items():
+            profile.loops[loc] = self._dict_to_loop(loop_data)
+        # Load blocks
+        for loc, block_data in data.get("blocks", {}).items():
+            profile.blocks[loc] = self._dict_to_block(block_data)
+        # Load indirect calls
+        for loc, call_data in data.get("indirect_calls", {}).items():
+            profile.indirect_calls[loc] = self._dict_to_indirect_call(call_data)
+        return profile
+    def _dict_to_function(self, data: dict[str, Any]) -> FunctionProfile:
+        """Convert dictionary to function profile."""
+        profile = FunctionProfile(
+            name=data["name"],
+            call_count=data.get("call_count", 0),
+            total_cycles=data.get("total_cycles", 0),
+            avg_cycles=data.get("avg_cycles", 0.0),
+            call_sites=data.get("call_sites", {}),
+            hot=data.get("hot", False),
+            inline_benefit=data.get("inline_benefit", 0.0),
+        )
+        return profile
+    def _dict_to_branch(self, data: dict[str, Any]) -> BranchProfile:
+        """Convert dictionary to branch profile."""
+        profile = BranchProfile(
+            location=data["location"],
+            taken_count=data.get("taken_count", 0),
+            not_taken_count=data.get("not_taken_count", 0),
+            taken_probability=data.get("taken_probability", 0.5),
+            predictable=data.get("predictable", False),
+        )
+        return profile
+    def _dict_to_loop(self, data: dict[str, Any]) -> LoopProfile:
+        """Convert dictionary to loop profile."""
+        min_iter_raw = data.get("min_iterations")
+        min_iter: int = 2**31 - 1  # Use max int instead of infinity
+        if min_iter_raw is not None:
+            min_iter = int(min_iter_raw)
+        profile = LoopProfile(
+            location=data["location"],
+            entry_count=data.get("entry_count", 0),
+            total_iterations=data.get("total_iterations", 0),
+            avg_iterations=data.get("avg_iterations", 0.0),
+            max_iterations=data.get("max_iterations", 0),
+            min_iterations=min_iter,
+            hot=data.get("hot", False),
+            unroll_benefit=data.get("unroll_benefit", 0.0),
+        )
+        return profile
+    def _dict_to_block(self, data: dict[str, Any]) -> BasicBlockProfile:
+        """Convert dictionary to basic block profile."""
+        profile = BasicBlockProfile(
+            location=data["location"],
+            execution_count=data.get("execution_count", 0),
+            instruction_count=data.get("instruction_count", 0),
+            total_cycles=data.get("total_cycles", 0),
+            avg_cycles=data.get("avg_cycles", 0.0),
+            hot=data.get("hot", False),
+        )
+        return profile
+    def _dict_to_indirect_call(self, data: dict[str, Any]) -> IndirectCallProfile:
+        """Convert dictionary to indirect call profile."""
+        profile = IndirectCallProfile(
+            location=data["location"],
+            targets=data.get("targets", {}),
+            total_calls=data.get("total_calls", 0),
+            most_common_target=data.get("most_common_target"),
+            devirtualization_benefit=data.get("devirtualization_benefit", 0.0),
+        )
+        return profile
+    def validate_profile(self, profile_data: ProfileData) -> list[str]:
+        """Validate profile data for consistency.
+        Args:
+            profile_data: Profile data to validate.
+        Returns:
+            List of validation warnings/errors.
+        """
+        warnings = []
+        # Check for empty profile
+        if profile_data.total_samples == 0:
+            warnings.append("Profile has no samples")
+        # Check function consistency
+        for name, func in profile_data.functions.items():
+            if func.call_count == 0 and func.total_cycles > 0:
+                warnings.append(f"Function {name} has cycles but no calls")
+            if func.call_count > 0 and func.avg_cycles == 0:
+                warnings.append(f"Function {name} has calls but no average cycles")
+        # Check branch consistency
+        for loc, branch in profile_data.branches.items():
+            total = branch.taken_count + branch.not_taken_count
+            if total == 0:
+                warnings.append(f"Branch {loc} has no executions")
+            elif abs(branch.taken_probability - (branch.taken_count / total)) > 0.01:
+                warnings.append(f"Branch {loc} has inconsistent probability")
+        # Check loop consistency
+        for loc, loop in profile_data.loops.items():
+            if loop.entry_count == 0 and loop.total_iterations > 0:
+                warnings.append(f"Loop {loc} has iterations but no entries")
+            if loop.max_iterations < loop.min_iterations:
+                warnings.append(f"Loop {loc} has max < min iterations")
+        return warnings

machine_dialect/mir/profiling/profile_writer.py ADDED Viewed

@@ -0,0 +1,226 @@
+"""Profile writer for persisting profile data.
+This module implements serialization of profile data to disk for
+reuse across compilation sessions.
+"""
+import json
+from pathlib import Path
+from typing import Any
+from machine_dialect.mir.profiling.profile_data import (
+    BasicBlockProfile,
+    BranchProfile,
+    FunctionProfile,
+    IndirectCallProfile,
+    LoopProfile,
+    ProfileData,
+)
+class ProfileWriter:
+    """Writes profile data to disk in various formats."""
+    def __init__(self) -> None:
+        """Initialize the profile writer."""
+        pass
+    def write_json(self, profile_data: ProfileData, filepath: Path | str) -> None:
+        """Write profile data to JSON format.
+        Args:
+            profile_data: Profile data to write.
+            filepath: Path to output file.
+        """
+        filepath = Path(filepath)
+        filepath.parent.mkdir(parents=True, exist_ok=True)
+        # Convert profile data to JSON-serializable format
+        data = self._profile_to_dict(profile_data)
+        # Write to file with pretty formatting
+        with open(filepath, "w") as f:
+            json.dump(data, f, indent=2, sort_keys=True)
+    def write_binary(self, profile_data: ProfileData, filepath: Path | str) -> None:
+        """Write profile data to efficient binary format.
+        Args:
+            profile_data: Profile data to write.
+            filepath: Path to output file.
+        """
+        import pickle
+        filepath = Path(filepath)
+        filepath.parent.mkdir(parents=True, exist_ok=True)
+        # Use pickle for binary serialization
+        with open(filepath, "wb") as f:
+            pickle.dump(profile_data, f, protocol=pickle.HIGHEST_PROTOCOL)
+    def write_summary(self, profile_data: ProfileData, filepath: Path | str) -> None:
+        """Write human-readable profile summary.
+        Args:
+            profile_data: Profile data to summarize.
+            filepath: Path to output file.
+        """
+        filepath = Path(filepath)
+        filepath.parent.mkdir(parents=True, exist_ok=True)
+        with open(filepath, "w") as f:
+            # Write header
+            f.write(f"Profile Summary for Module: {profile_data.module_name}\n")
+            f.write("=" * 60 + "\n\n")
+            # Write statistics
+            summary = profile_data.get_summary()
+            f.write(f"Total Samples: {summary['total_samples']}\n\n")
+            # Function statistics
+            f.write("Functions:\n")
+            f.write(f"  Total: {summary['functions']['total']}\n")
+            f.write(f"  Hot: {summary['functions']['hot']}\n\n")
+            # Hot functions details
+            if profile_data.functions:
+                f.write("Hot Functions (Top 10):\n")
+                sorted_funcs = sorted(profile_data.functions.values(), key=lambda x: x.call_count, reverse=True)[:10]
+                for func in sorted_funcs:
+                    f.write(f"  {func.name}:\n")
+                    f.write(f"    Calls: {func.call_count}\n")
+                    f.write(f"    Avg Cycles: {func.avg_cycles:.2f}\n")
+                    if func.inline_benefit > 0:
+                        f.write(f"    Inline Benefit: {func.inline_benefit:.2f}\n")
+                f.write("\n")
+            # Branch statistics
+            f.write("Branches:\n")
+            f.write(f"  Total: {summary['branches']['total']}\n")
+            f.write(f"  Predictable: {summary['branches']['predictable']}\n\n")
+            # Predictable branches details
+            predictable = [b for b in profile_data.branches.values() if b.predictable]
+            if predictable:
+                f.write("Predictable Branches (Top 10):\n")
+                for branch in predictable[:10]:
+                    f.write(f"  {branch.location}:\n")
+                    f.write(f"    Taken: {branch.taken_probability:.1%}\n")
+                f.write("\n")
+            # Loop statistics
+            f.write("Loops:\n")
+            f.write(f"  Total: {summary['loops']['total']}\n")
+            f.write(f"  Hot: {summary['loops']['hot']}\n\n")
+            # Hot loops details
+            hot_loops = [loop for loop in profile_data.loops.values() if loop.hot]
+            if hot_loops:
+                f.write("Hot Loops (Top 10):\n")
+                sorted_loops = sorted(hot_loops, key=lambda x: x.total_iterations, reverse=True)[:10]
+                for loop in sorted_loops:
+                    f.write(f"  {loop.location}:\n")
+                    f.write(f"    Iterations: {loop.total_iterations}\n")
+                    f.write(f"    Avg per Entry: {loop.avg_iterations:.2f}\n")
+                    if loop.unroll_benefit > 0:
+                        f.write(f"    Unroll Benefit: {loop.unroll_benefit:.2f}\n")
+                f.write("\n")
+            # Indirect call statistics
+            f.write("Indirect Calls:\n")
+            f.write(f"  Total: {summary['indirect_calls']['total']}\n")
+            f.write(f"  Devirtualizable: {summary['indirect_calls']['devirtualizable']}\n\n")
+            # Devirtualization opportunities
+            devirt = [c for c in profile_data.indirect_calls.values() if c.devirtualization_benefit > 50]
+            if devirt:
+                f.write("Devirtualization Opportunities:\n")
+                for call in devirt:
+                    f.write(f"  {call.location}:\n")
+                    f.write(f"    Target: {call.most_common_target}\n")
+                    f.write(f"    Benefit: {call.devirtualization_benefit:.2f}\n")
+    def _profile_to_dict(self, profile_data: ProfileData) -> dict[str, Any]:
+        """Convert profile data to dictionary.
+        Args:
+            profile_data: Profile data to convert.
+        Returns:
+            Dictionary representation.
+        """
+        return {
+            "module_name": profile_data.module_name,
+            "total_samples": profile_data.total_samples,
+            "metadata": profile_data.metadata,
+            "functions": {name: self._function_to_dict(prof) for name, prof in profile_data.functions.items()},
+            "branches": {loc: self._branch_to_dict(prof) for loc, prof in profile_data.branches.items()},
+            "loops": {loc: self._loop_to_dict(prof) for loc, prof in profile_data.loops.items()},
+            "blocks": {loc: self._block_to_dict(prof) for loc, prof in profile_data.blocks.items()},
+            "indirect_calls": {
+                loc: self._indirect_call_to_dict(prof) for loc, prof in profile_data.indirect_calls.items()
+            },
+        }
+    def _function_to_dict(self, profile: FunctionProfile) -> dict[str, Any]:
+        """Convert function profile to dictionary."""
+        return {
+            "name": profile.name,
+            "call_count": profile.call_count,
+            "total_cycles": profile.total_cycles,
+            "avg_cycles": profile.avg_cycles,
+            "call_sites": profile.call_sites,
+            "hot": profile.hot,
+            "inline_benefit": profile.inline_benefit,
+        }
+    def _branch_to_dict(self, profile: BranchProfile) -> dict[str, Any]:
+        """Convert branch profile to dictionary."""
+        return {
+            "location": profile.location,
+            "taken_count": profile.taken_count,
+            "not_taken_count": profile.not_taken_count,
+            "taken_probability": profile.taken_probability,
+            "predictable": profile.predictable,
+        }
+    def _loop_to_dict(self, profile: LoopProfile) -> dict[str, Any]:
+        """Convert loop profile to dictionary."""
+        # Handle max int as None for JSON
+        min_iter = profile.min_iterations
+        if min_iter == 2**31 - 1:  # Max int sentinel value
+            min_iter_value: int | None = None
+        else:
+            min_iter_value = min_iter
+        return {
+            "location": profile.location,
+            "entry_count": profile.entry_count,
+            "total_iterations": profile.total_iterations,
+            "avg_iterations": profile.avg_iterations,
+            "max_iterations": profile.max_iterations,
+            "min_iterations": min_iter_value,
+            "hot": profile.hot,
+            "unroll_benefit": profile.unroll_benefit,
+        }
+    def _block_to_dict(self, profile: BasicBlockProfile) -> dict[str, Any]:
+        """Convert basic block profile to dictionary."""
+        return {
+            "location": profile.location,
+            "execution_count": profile.execution_count,
+            "instruction_count": profile.instruction_count,
+            "total_cycles": profile.total_cycles,
+            "avg_cycles": profile.avg_cycles,
+            "hot": profile.hot,
+        }
+    def _indirect_call_to_dict(self, profile: IndirectCallProfile) -> dict[str, Any]:
+        """Convert indirect call profile to dictionary."""
+        return {
+            "location": profile.location,
+            "targets": profile.targets,
+            "total_calls": profile.total_calls,
+            "most_common_target": profile.most_common_target,
+            "devirtualization_benefit": profile.devirtualization_benefit,
+        }