PyPI - machine-dialect - Versions diffs - 0.1.0a1__py3-none-any.whl - Mend

machine-dialect 0.1.0a1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (268) hide show

machine_dialect/__main__.py +667 -0
machine_dialect/agent/__init__.py +5 -0
machine_dialect/agent/agent.py +360 -0
machine_dialect/ast/__init__.py +95 -0
machine_dialect/ast/ast_node.py +35 -0
machine_dialect/ast/call_expression.py +82 -0
machine_dialect/ast/dict_extraction.py +60 -0
machine_dialect/ast/expressions.py +439 -0
machine_dialect/ast/literals.py +309 -0
machine_dialect/ast/program.py +35 -0
machine_dialect/ast/statements.py +1433 -0
machine_dialect/ast/tests/test_ast_string_representation.py +62 -0
machine_dialect/ast/tests/test_boolean_literal.py +29 -0
machine_dialect/ast/tests/test_collection_hir.py +138 -0
machine_dialect/ast/tests/test_define_statement.py +142 -0
machine_dialect/ast/tests/test_desugar.py +541 -0
machine_dialect/ast/tests/test_foreach_desugar.py +245 -0
machine_dialect/cfg/__init__.py +6 -0
machine_dialect/cfg/config.py +156 -0
machine_dialect/cfg/examples.py +221 -0
machine_dialect/cfg/generate_with_ai.py +187 -0
machine_dialect/cfg/openai_generation.py +200 -0
machine_dialect/cfg/parser.py +94 -0
machine_dialect/cfg/tests/__init__.py +1 -0
machine_dialect/cfg/tests/test_cfg_parser.py +252 -0
machine_dialect/cfg/tests/test_config.py +188 -0
machine_dialect/cfg/tests/test_examples.py +391 -0
machine_dialect/cfg/tests/test_generate_with_ai.py +354 -0
machine_dialect/cfg/tests/test_openai_generation.py +256 -0
machine_dialect/codegen/__init__.py +5 -0
machine_dialect/codegen/bytecode_module.py +89 -0
machine_dialect/codegen/bytecode_serializer.py +300 -0
machine_dialect/codegen/opcodes.py +101 -0
machine_dialect/codegen/register_codegen.py +1996 -0
machine_dialect/codegen/symtab.py +208 -0
machine_dialect/codegen/tests/__init__.py +1 -0
machine_dialect/codegen/tests/test_array_operations_codegen.py +295 -0
machine_dialect/codegen/tests/test_bytecode_serializer.py +185 -0
machine_dialect/codegen/tests/test_register_codegen_ssa.py +324 -0
machine_dialect/codegen/tests/test_symtab.py +418 -0
machine_dialect/codegen/vm_serializer.py +621 -0
machine_dialect/compiler/__init__.py +18 -0
machine_dialect/compiler/compiler.py +197 -0
machine_dialect/compiler/config.py +149 -0
machine_dialect/compiler/context.py +149 -0
machine_dialect/compiler/phases/__init__.py +19 -0
machine_dialect/compiler/phases/bytecode_optimization.py +90 -0
machine_dialect/compiler/phases/codegen.py +40 -0
machine_dialect/compiler/phases/hir_generation.py +39 -0
machine_dialect/compiler/phases/mir_generation.py +86 -0
machine_dialect/compiler/phases/optimization.py +110 -0
machine_dialect/compiler/phases/parsing.py +39 -0
machine_dialect/compiler/pipeline.py +143 -0
machine_dialect/compiler/tests/__init__.py +1 -0
machine_dialect/compiler/tests/test_compiler.py +568 -0
machine_dialect/compiler/vm_runner.py +173 -0
machine_dialect/errors/__init__.py +32 -0
machine_dialect/errors/exceptions.py +369 -0
machine_dialect/errors/messages.py +82 -0
machine_dialect/errors/tests/__init__.py +0 -0
machine_dialect/errors/tests/test_expected_token_errors.py +188 -0
machine_dialect/errors/tests/test_name_errors.py +118 -0
machine_dialect/helpers/__init__.py +0 -0
machine_dialect/helpers/stopwords.py +225 -0
machine_dialect/helpers/validators.py +30 -0
machine_dialect/lexer/__init__.py +9 -0
machine_dialect/lexer/constants.py +23 -0
machine_dialect/lexer/lexer.py +907 -0
machine_dialect/lexer/tests/__init__.py +0 -0
machine_dialect/lexer/tests/helpers.py +86 -0
machine_dialect/lexer/tests/test_apostrophe_identifiers.py +122 -0
machine_dialect/lexer/tests/test_backtick_identifiers.py +140 -0
machine_dialect/lexer/tests/test_boolean_literals.py +108 -0
machine_dialect/lexer/tests/test_case_insensitive_keywords.py +188 -0
machine_dialect/lexer/tests/test_comments.py +200 -0
machine_dialect/lexer/tests/test_double_asterisk_keywords.py +127 -0
machine_dialect/lexer/tests/test_lexer_position.py +113 -0
machine_dialect/lexer/tests/test_list_tokens.py +282 -0
machine_dialect/lexer/tests/test_stopwords.py +80 -0
machine_dialect/lexer/tests/test_strict_equality.py +129 -0
machine_dialect/lexer/tests/test_token.py +41 -0
machine_dialect/lexer/tests/test_tokenization.py +294 -0
machine_dialect/lexer/tests/test_underscore_literals.py +343 -0
machine_dialect/lexer/tests/test_url_literals.py +169 -0
machine_dialect/lexer/tokens.py +487 -0
machine_dialect/linter/__init__.py +10 -0
machine_dialect/linter/__main__.py +144 -0
machine_dialect/linter/linter.py +154 -0
machine_dialect/linter/rules/__init__.py +8 -0
machine_dialect/linter/rules/base.py +112 -0
machine_dialect/linter/rules/statement_termination.py +99 -0
machine_dialect/linter/tests/__init__.py +1 -0
machine_dialect/linter/tests/mdrules/__init__.py +0 -0
machine_dialect/linter/tests/mdrules/test_md101_statement_termination.py +181 -0
machine_dialect/linter/tests/test_linter.py +81 -0
machine_dialect/linter/tests/test_rules.py +110 -0
machine_dialect/linter/tests/test_violations.py +71 -0
machine_dialect/linter/violations.py +51 -0
machine_dialect/mir/__init__.py +69 -0
machine_dialect/mir/analyses/__init__.py +20 -0
machine_dialect/mir/analyses/alias_analysis.py +315 -0
machine_dialect/mir/analyses/dominance_analysis.py +49 -0
machine_dialect/mir/analyses/escape_analysis.py +286 -0
machine_dialect/mir/analyses/loop_analysis.py +272 -0
machine_dialect/mir/analyses/tests/test_type_analysis.py +736 -0
machine_dialect/mir/analyses/type_analysis.py +448 -0
machine_dialect/mir/analyses/use_def_chains.py +232 -0
machine_dialect/mir/basic_block.py +385 -0
machine_dialect/mir/dataflow.py +445 -0
machine_dialect/mir/debug_info.py +208 -0
machine_dialect/mir/hir_to_mir.py +1738 -0
machine_dialect/mir/mir_dumper.py +366 -0
machine_dialect/mir/mir_function.py +167 -0
machine_dialect/mir/mir_instructions.py +1877 -0
machine_dialect/mir/mir_interpreter.py +556 -0
machine_dialect/mir/mir_module.py +225 -0
machine_dialect/mir/mir_printer.py +480 -0
machine_dialect/mir/mir_transformer.py +410 -0
machine_dialect/mir/mir_types.py +367 -0
machine_dialect/mir/mir_validation.py +455 -0
machine_dialect/mir/mir_values.py +268 -0
machine_dialect/mir/optimization_config.py +233 -0
machine_dialect/mir/optimization_pass.py +251 -0
machine_dialect/mir/optimization_pipeline.py +355 -0
machine_dialect/mir/optimizations/__init__.py +84 -0
machine_dialect/mir/optimizations/algebraic_simplification.py +733 -0
machine_dialect/mir/optimizations/branch_prediction.py +372 -0
machine_dialect/mir/optimizations/constant_propagation.py +634 -0
machine_dialect/mir/optimizations/cse.py +398 -0
machine_dialect/mir/optimizations/dce.py +288 -0
machine_dialect/mir/optimizations/inlining.py +551 -0
machine_dialect/mir/optimizations/jump_threading.py +487 -0
machine_dialect/mir/optimizations/licm.py +405 -0
machine_dialect/mir/optimizations/loop_unrolling.py +366 -0
machine_dialect/mir/optimizations/strength_reduction.py +422 -0
machine_dialect/mir/optimizations/tail_call.py +207 -0
machine_dialect/mir/optimizations/tests/test_loop_unrolling.py +483 -0
machine_dialect/mir/optimizations/type_narrowing.py +397 -0
machine_dialect/mir/optimizations/type_specialization.py +447 -0
machine_dialect/mir/optimizations/type_specific.py +906 -0
machine_dialect/mir/optimize_mir.py +89 -0
machine_dialect/mir/pass_manager.py +391 -0
machine_dialect/mir/profiling/__init__.py +26 -0
machine_dialect/mir/profiling/profile_collector.py +318 -0
machine_dialect/mir/profiling/profile_data.py +372 -0
machine_dialect/mir/profiling/profile_reader.py +272 -0
machine_dialect/mir/profiling/profile_writer.py +226 -0
machine_dialect/mir/register_allocation.py +302 -0
machine_dialect/mir/reporting/__init__.py +17 -0
machine_dialect/mir/reporting/optimization_reporter.py +314 -0
machine_dialect/mir/reporting/report_formatter.py +289 -0
machine_dialect/mir/ssa_construction.py +342 -0
machine_dialect/mir/tests/__init__.py +1 -0
machine_dialect/mir/tests/test_algebraic_associativity.py +204 -0
machine_dialect/mir/tests/test_algebraic_complex_patterns.py +221 -0
machine_dialect/mir/tests/test_algebraic_division.py +126 -0
machine_dialect/mir/tests/test_algebraic_simplification.py +863 -0
machine_dialect/mir/tests/test_basic_block.py +425 -0
machine_dialect/mir/tests/test_branch_prediction.py +459 -0
machine_dialect/mir/tests/test_call_lowering.py +168 -0
machine_dialect/mir/tests/test_collection_lowering.py +604 -0
machine_dialect/mir/tests/test_cross_block_constant_propagation.py +255 -0
machine_dialect/mir/tests/test_custom_passes.py +166 -0
machine_dialect/mir/tests/test_debug_info.py +285 -0
machine_dialect/mir/tests/test_dict_extraction_lowering.py +192 -0
machine_dialect/mir/tests/test_dictionary_lowering.py +299 -0
machine_dialect/mir/tests/test_double_negation.py +231 -0
machine_dialect/mir/tests/test_escape_analysis.py +233 -0
machine_dialect/mir/tests/test_hir_to_mir.py +465 -0
machine_dialect/mir/tests/test_hir_to_mir_complete.py +389 -0
machine_dialect/mir/tests/test_hir_to_mir_simple.py +130 -0
machine_dialect/mir/tests/test_inlining.py +435 -0
machine_dialect/mir/tests/test_licm.py +472 -0
machine_dialect/mir/tests/test_mir_dumper.py +313 -0
machine_dialect/mir/tests/test_mir_instructions.py +445 -0
machine_dialect/mir/tests/test_mir_module.py +860 -0
machine_dialect/mir/tests/test_mir_printer.py +387 -0
machine_dialect/mir/tests/test_mir_types.py +123 -0
machine_dialect/mir/tests/test_mir_types_enhanced.py +132 -0
machine_dialect/mir/tests/test_mir_validation.py +378 -0
machine_dialect/mir/tests/test_mir_values.py +168 -0
machine_dialect/mir/tests/test_one_based_indexing.py +202 -0
machine_dialect/mir/tests/test_optimization_helpers.py +60 -0
machine_dialect/mir/tests/test_optimization_pipeline.py +554 -0
machine_dialect/mir/tests/test_optimization_reporter.py +318 -0
machine_dialect/mir/tests/test_pass_manager.py +294 -0
machine_dialect/mir/tests/test_pass_registration.py +64 -0
machine_dialect/mir/tests/test_profiling.py +356 -0
machine_dialect/mir/tests/test_register_allocation.py +307 -0
machine_dialect/mir/tests/test_report_formatters.py +372 -0
machine_dialect/mir/tests/test_ssa_construction.py +433 -0
machine_dialect/mir/tests/test_tail_call.py +236 -0
machine_dialect/mir/tests/test_type_annotated_instructions.py +192 -0
machine_dialect/mir/tests/test_type_narrowing.py +277 -0
machine_dialect/mir/tests/test_type_specialization.py +421 -0
machine_dialect/mir/tests/test_type_specific_optimization.py +545 -0
machine_dialect/mir/tests/test_type_specific_optimization_advanced.py +382 -0
machine_dialect/mir/type_inference.py +368 -0
machine_dialect/parser/__init__.py +12 -0
machine_dialect/parser/enums.py +45 -0
machine_dialect/parser/parser.py +3655 -0
machine_dialect/parser/protocols.py +11 -0
machine_dialect/parser/symbol_table.py +169 -0
machine_dialect/parser/tests/__init__.py +0 -0
machine_dialect/parser/tests/helper_functions.py +193 -0
machine_dialect/parser/tests/test_action_statements.py +334 -0
machine_dialect/parser/tests/test_boolean_literal_expressions.py +152 -0
machine_dialect/parser/tests/test_call_statements.py +154 -0
machine_dialect/parser/tests/test_call_statements_errors.py +187 -0
machine_dialect/parser/tests/test_collection_mutations.py +264 -0
machine_dialect/parser/tests/test_conditional_expressions.py +343 -0
machine_dialect/parser/tests/test_define_integration.py +468 -0
machine_dialect/parser/tests/test_define_statements.py +311 -0
machine_dialect/parser/tests/test_dict_extraction.py +115 -0
machine_dialect/parser/tests/test_empty_literal.py +155 -0
machine_dialect/parser/tests/test_float_literal_expressions.py +163 -0
machine_dialect/parser/tests/test_identifier_expressions.py +57 -0
machine_dialect/parser/tests/test_if_empty_block.py +61 -0
machine_dialect/parser/tests/test_if_statements.py +299 -0
machine_dialect/parser/tests/test_illegal_tokens.py +86 -0
machine_dialect/parser/tests/test_infix_expressions.py +680 -0
machine_dialect/parser/tests/test_integer_literal_expressions.py +137 -0
machine_dialect/parser/tests/test_interaction_statements.py +269 -0
machine_dialect/parser/tests/test_list_literals.py +277 -0
machine_dialect/parser/tests/test_no_none_in_ast.py +94 -0
machine_dialect/parser/tests/test_panic_mode_recovery.py +171 -0
machine_dialect/parser/tests/test_parse_errors.py +114 -0
machine_dialect/parser/tests/test_possessive_syntax.py +182 -0
machine_dialect/parser/tests/test_prefix_expressions.py +415 -0
machine_dialect/parser/tests/test_program.py +13 -0
machine_dialect/parser/tests/test_return_statements.py +89 -0
machine_dialect/parser/tests/test_set_statements.py +152 -0
machine_dialect/parser/tests/test_strict_equality.py +258 -0
machine_dialect/parser/tests/test_symbol_table.py +217 -0
machine_dialect/parser/tests/test_url_literal_expressions.py +209 -0
machine_dialect/parser/tests/test_utility_statements.py +423 -0
machine_dialect/parser/token_buffer.py +159 -0
machine_dialect/repl/__init__.py +3 -0
machine_dialect/repl/repl.py +426 -0
machine_dialect/repl/tests/__init__.py +0 -0
machine_dialect/repl/tests/test_repl.py +606 -0
machine_dialect/semantic/__init__.py +12 -0
machine_dialect/semantic/analyzer.py +906 -0
machine_dialect/semantic/error_messages.py +189 -0
machine_dialect/semantic/tests/__init__.py +1 -0
machine_dialect/semantic/tests/test_analyzer.py +364 -0
machine_dialect/semantic/tests/test_error_messages.py +104 -0
machine_dialect/tests/edge_cases/__init__.py +10 -0
machine_dialect/tests/edge_cases/test_boundary_access.py +256 -0
machine_dialect/tests/edge_cases/test_empty_collections.py +166 -0
machine_dialect/tests/edge_cases/test_invalid_operations.py +243 -0
machine_dialect/tests/edge_cases/test_named_list_edge_cases.py +295 -0
machine_dialect/tests/edge_cases/test_nested_structures.py +313 -0
machine_dialect/tests/edge_cases/test_type_mixing.py +277 -0
machine_dialect/tests/integration/test_array_operations_emulation.py +248 -0
machine_dialect/tests/integration/test_list_compilation.py +395 -0
machine_dialect/tests/integration/test_lists_and_dictionaries.py +322 -0
machine_dialect/type_checking/__init__.py +21 -0
machine_dialect/type_checking/tests/__init__.py +1 -0
machine_dialect/type_checking/tests/test_type_system.py +230 -0
machine_dialect/type_checking/type_system.py +270 -0
machine_dialect-0.1.0a1.dist-info/METADATA +128 -0
machine_dialect-0.1.0a1.dist-info/RECORD +268 -0
machine_dialect-0.1.0a1.dist-info/WHEEL +5 -0
machine_dialect-0.1.0a1.dist-info/entry_points.txt +3 -0
machine_dialect-0.1.0a1.dist-info/licenses/LICENSE +201 -0
machine_dialect-0.1.0a1.dist-info/top_level.txt +2 -0
machine_dialect_vm/__init__.pyi +15 -0

machine_dialect/agent/agent.py ADDED Viewed

@@ -0,0 +1,360 @@
+"""AI Agent for iterative Machine Dialect™ code generation and execution."""
+import tempfile
+import time
+from dataclasses import dataclass
+from pathlib import Path
+from typing import Any
+from machine_dialect.cfg.openai_generation import generate_with_openai
+from machine_dialect.compiler import Compiler, CompilerConfig
+from machine_dialect.compiler.config import OptimizationLevel
+@dataclass
+class AgentResult:
+    """Outcome of a single agent run.
+    Only ``success`` and ``iterations`` are required; the remaining fields
+    default to None when there is nothing to report.
+    """
+    # True when the task was completed successfully.
+    success: bool
+    # How many iterations the run took.
+    iterations: int
+    # Final code, present when the run succeeded.
+    code: str | None = None
+    # Output of the program, if it produced any.
+    output: str | None = None
+    # Complete per-iteration history of the run.
+    history: list[dict[str, Any]] | None = None
+class Agent:
+    """Iterative AI agent for Machine Dialect™ code generation.
+    Each iteration asks the model for code, compiles and executes it, and on
+    failure folds the error into the prompt used for the next attempt.
+    """
+    # Lowercase substrings that mark a line as worth keeping when a long task
+    # description is condensed by _simplify_task.
+    _ESSENTIAL_KEYWORDS = (
+        "generate",
+        "create",
+        "calculate",
+        "implement",
+        "write",
+        "error:",
+        "failed:",
+        "fix",
+        "please",
+    )
+    def __init__(self, client: Any, model: str = "gpt-5", verbose: bool = True):
+        """Initialize the agent.
+        Args:
+            client: OpenAI client instance.
+            model: Model to use for generation.
+            verbose: Whether to print progress.
+        """
+        self.client = client
+        self.model = model
+        self.verbose = verbose
+        self.iterations: list[dict[str, Any]] = []
+        # Accumulates across calls to solve(); it is never reset here.
+        self.total_tokens_used = 0
+    def solve(self, task: str, max_iterations: int = 5) -> AgentResult:
+        """Solve a task through iterative code generation.
+        Args:
+            task: The task description.
+            max_iterations: Maximum iterations to attempt.
+        Returns:
+            AgentResult with solution details. ``success`` is True when at
+            least one iteration compiled and executed without error.
+        """
+        start_time = time.time()
+        if self.verbose:
+            print(f"🤖 Agent starting: {task}")
+            print(f"   Model: {self.model}")
+            print(f"   Max iterations: {max_iterations}")
+        self.iterations = []
+        current_task = task
+        successful_code = None
+        final_output = None
+        for iteration_num in range(1, max_iterations + 1):
+            if self.verbose:
+                print(f"\n📍 Iteration {iteration_num}/{max_iterations}")
+            # Generate code. Any failure here consumes the iteration and the
+            # same prompt is retried on the next one.
+            try:
+                if self.verbose:
+                    print("   Generating code...")
+                gen_start = time.time()
+                code, token_info = self._generate(current_task)
+                gen_time = time.time() - gen_start
+                self._report_generation(code, token_info, gen_time)
+            except Exception as e:
+                if self.verbose:
+                    print(f"   ✗ Generation failed: {e}")
+                self.iterations.append(
+                    {"iteration": iteration_num, "code": None, "error": str(e), "phase": "generation"}
+                )
+                continue
+            # Compile and execute, then record the attempt.
+            result = self._execute(code)
+            self.iterations.append({"iteration": iteration_num, "code": code, "result": result})
+            if not result["success"]:
+                error = result.get("error", "Unknown error")
+                phase = result.get("phase", "execution")
+                if self.verbose:
+                    print(f"   ❌ {phase.capitalize()} error: {error}")
+                # Feed the failure back into the next prompt.
+                current_task = self._build_error_feedback(task, code, error, phase)
+                continue
+            if self.verbose:
+                output_msg = result.get("output", "No output")
+                print(f"   ✅ Success! Output: {output_msg}")
+                if result.get("instructions"):
+                    print(f"   📊 Executed {result['instructions']} instructions")
+            successful_code = code
+            final_output = result.get("output")
+            # Keep iterating only when there is budget left and optimization is
+            # wanted. This decision must not depend on the verbose flag.
+            if iteration_num >= max_iterations or not self._should_optimize(task, code, result):
+                break
+            current_task = f"Optimize this working solution for: {task}\n\nCurrent code:\n{code}"
+        total_time = time.time() - start_time
+        if self.verbose:
+            if self.total_tokens_used > 0:
+                print(f"\n💰 Total: {self.total_tokens_used:,} tokens in {total_time:.2f}s")
+            else:
+                print(f"\n⏱️ Total time: {total_time:.2f}s")
+        return AgentResult(
+            success=successful_code is not None,
+            iterations=len(self.iterations),
+            code=successful_code,
+            output=final_output,
+            history=self.iterations,
+        )
+    def _report_generation(self, code: str, token_info: dict[str, int] | None, gen_time: float) -> None:
+        """Record token usage for one generation and print progress if verbose.
+        Args:
+            code: The generated code (echoed for debugging when verbose).
+            token_info: Usage stats from the generator; may be empty or None.
+            gen_time: Seconds spent generating.
+        """
+        if not token_info:
+            if self.verbose:
+                print("   ✓ Code generated (CFG-constrained)")
+                print(f"   Debug: Generated code: {code!r}")
+            return
+        total = token_info.get("total_tokens", 0)
+        prompt = token_info.get("prompt_tokens")
+        completion = token_info.get("completion_tokens")
+        if total:
+            self.total_tokens_used += total
+        if not self.verbose:
+            return
+        print(f"   ✓ Code generated (CFG-constrained) in {gen_time:.2f}s")
+        # Show the breakdown when available, otherwise just the total.
+        if prompt is not None and completion is not None:
+            print(f"   📊 Tokens: {prompt} prompt + {completion} completion = {total} total")
+        elif total:
+            print(f"   📊 Tokens: {total} total")
+        if self.total_tokens_used > 0:
+            print(f"   📈 Cumulative: {self.total_tokens_used:,} tokens")
+        print(f"   Debug: Generated code: {code!r}")
+    def _generate(self, task: str) -> tuple[str, dict[str, int]]:
+        """Generate code using CFG constraints.
+        Args:
+            task: Task description with any feedback.
+        Returns:
+            Tuple of (code, token_info) where token_info contains usage stats.
+        """
+        simplified_task = self._simplify_task(task)
+        return generate_with_openai(
+            self.client,
+            self.model,
+            simplified_task,
+            max_tokens=800,
+            temperature=0.7,  # Will be ignored for GPT-5
+        )
+    def _simplify_task(self, task: str) -> str:
+        """Simplify complex task descriptions for better generation.
+        Tasks longer than 500 characters are reduced to the first 10 lines
+        containing one of ``_ESSENTIAL_KEYWORDS``; if no line matches, the task
+        is left as is. A syntax reminder is appended unless the text already
+        mentions an error.
+        Args:
+            task: Original task description.
+        Returns:
+            Simplified task description.
+        """
+        simplified = task
+        if len(task) > 500:
+            essential_lines = []
+            for line in task.split("\n"):
+                lowered = line.lower()
+                if any(keyword in lowered for keyword in self._ESSENTIAL_KEYWORDS):
+                    essential_lines.append(line)
+            if essential_lines:
+                # Keep only the first 10 matching lines.
+                simplified = "\n".join(essential_lines[:10])
+        if "error" not in simplified.lower():
+            simplified += (
+                "\nNote: Use Machine Dialect™ syntax with backticks for variables and underscores for literals."
+            )
+        return simplified
+    def _execute(self, code: str) -> dict[str, Any]:
+        """Compile and execute Machine Dialect™ code.
+        Args:
+            code: The code to execute.
+        Returns:
+            Execution result dictionary. It always has ``success`` and
+            ``phase``; failures add ``error``, successes add ``output``,
+            ``instructions`` and ``bytecode_size``. Exceptions are reported in
+            the dictionary rather than raised.
+        """
+        temp_path = None
+        # Tracks which stage an unexpected exception should be attributed to.
+        phase = "compilation"
+        try:
+            # Compile without optimizations
+            config = CompilerConfig(optimization_level=OptimizationLevel.NONE, verbose=False)
+            compiler = Compiler(config)
+            if self.verbose:
+                print("   Compiling...")
+            context = compiler.compile_string(code, module_name="agent_task")
+            if context.has_errors():
+                # Report the first error only; fall back to a generic message.
+                error_msg = str(context.errors[0]) if context.errors else "Compilation failed"
+                return {"success": False, "phase": "compilation", "error": error_msg}
+            if not context.bytecode_module:
+                raise ValueError("Compilation succeeded but no bytecode generated")
+            # Serialize once and reuse for the size report and the file.
+            bytecode = context.bytecode_module.serialize()
+            if self.verbose:
+                print(f"   ✓ Compiled successfully ({len(bytecode)} bytes)")
+            phase = "runtime"
+            with tempfile.NamedTemporaryFile(suffix=".mdbc", delete=False) as f:
+                # Remember the path before writing so the finally block can
+                # remove the file even if the write fails.
+                temp_path = f.name
+                f.write(bytecode)
+            if self.verbose:
+                print("   Executing bytecode...")
+            # Only a failure to import the VM itself means it is unavailable.
+            try:
+                import machine_dialect_vm
+            except ImportError:
+                return {
+                    "success": False,
+                    "phase": "runtime",
+                    "error": "Rust VM not available. Run ./build_vm.sh first.",
+                }
+            vm = machine_dialect_vm.RustVM()
+            vm.load_bytecode(temp_path)
+            output = vm.execute()
+            instructions = vm.instruction_count()
+            return {
+                "success": True,
+                "phase": "runtime",
+                "output": str(output) if output is not None else "",
+                "instructions": instructions,
+                "bytecode_size": len(bytecode),
+            }
+        except Exception as e:
+            return {"success": False, "phase": phase, "error": str(e)}
+        finally:
+            # Clean up temp file
+            if temp_path:
+                Path(temp_path).unlink(missing_ok=True)
+    def _build_error_feedback(self, original_task: str, code: str, error: str, phase: str) -> str:
+        """Build task description with error feedback.
+        Args:
+            original_task: Original task description.
+            code: Code that failed.
+            error: Error message.
+            phase: Phase where error occurred.
+        Returns:
+            Enhanced task description for retry.
+        """
+        return (
+            f"{original_task}\n\n"
+            f"Previous attempt failed during {phase}:\n"
+            f"Code:\n```\n{code}\n```\n\n"
+            f"Error: {error}\n\n"
+            "Please fix this error and provide a working solution."
+        )
+    def _should_optimize(self, task: str, code: str, result: dict[str, Any]) -> bool:
+        """Decide if we should try to optimize working code.
+        Args:
+            task: Original task.
+            code: Working code.
+            result: Execution result.
+        Returns:
+            Whether to attempt optimization. Currently always False.
+        """
+        # Optimization retries are disabled for now: the first success is kept.
+        # The arguments are accepted so a real heuristic (e.g. based on
+        # result["instructions"]) can be added without changing callers.
+        return False

machine_dialect/ast/__init__.py ADDED Viewed

@@ -0,0 +1,95 @@
+# isort: skip_file
+from .ast_node import ASTNode
+from .expressions import (
+    Arguments,
+    CollectionAccessExpression,
+    ConditionalExpression,
+    ErrorExpression,
+    Expression,
+    Identifier,
+    InfixExpression,
+    PrefixExpression,
+)
+from .dict_extraction import DictExtraction
+from .statements import (
+    ActionStatement,
+    BlockStatement,
+    CallStatement,
+    CollectionMutationStatement,
+    DefineStatement,
+    ErrorStatement,
+    ExpressionStatement,
+    ForEachStatement,
+    FunctionStatement,
+    FunctionVisibility,
+    IfStatement,
+    InteractionStatement,
+    Output,
+    Parameter,
+    ReturnStatement,
+    SayStatement,
+    SetStatement,
+    Statement,
+    UtilityStatement,
+    WhileStatement,
+)
+from .program import Program
+from .literals import (
+    WholeNumberLiteral,
+    FloatLiteral,
+    StringLiteral,
+    YesNoLiteral,
+    EmptyLiteral,
+    URLLiteral,
+    UnorderedListLiteral,
+    OrderedListLiteral,
+    NamedListLiteral,
+    BlankLiteral,
+)
+from .call_expression import CallExpression
+# Public names exported by this package; every entry is imported above.
+__all__ = [
+    "ASTNode",
+    "ActionStatement",
+    "Arguments",
+    "BlankLiteral",
+    "BlockStatement",
+    "CallExpression",
+    "CallStatement",
+    "CollectionAccessExpression",
+    "CollectionMutationStatement",
+    "ConditionalExpression",
+    "DefineStatement",
+    "DictExtraction",
+    "EmptyLiteral",
+    "ErrorExpression",
+    "ErrorStatement",
+    "Expression",
+    "ExpressionStatement",
+    "FloatLiteral",
+    "ForEachStatement",
+    "FunctionStatement",
+    "FunctionVisibility",
+    "Identifier",
+    "IfStatement",
+    "InfixExpression",
+    "InteractionStatement",
+    "NamedListLiteral",
+    "OrderedListLiteral",
+    "Output",
+    "Parameter",
+    "PrefixExpression",
+    "Program",
+    "ReturnStatement",
+    "SayStatement",
+    "SetStatement",
+    "Statement",
+    "StringLiteral",
+    "URLLiteral",
+    "UnorderedListLiteral",
+    "UtilityStatement",
+    "WhileStatement",
+    "WholeNumberLiteral",
+    "YesNoLiteral",
+]

machine_dialect/ast/ast_node.py ADDED Viewed

@@ -0,0 +1,35 @@
+from abc import ABC, abstractmethod
+from typing import TYPE_CHECKING
+if TYPE_CHECKING:
+    from machine_dialect.lexer.tokens import Token
+class ASTNode(ABC):
+    """Abstract base class for AST nodes.
+    Concrete nodes must implement ``__str__``; ``desugar`` and
+    ``get_source_location`` come with default behaviour.
+    """
+    @abstractmethod
+    def __str__(self) -> str:
+        """Return the textual form of this node."""
+    def desugar(self) -> "ASTNode":
+        """Return a simplified form of this node for IR generation.
+        Desugaring strips syntactic sugar and normalizes constructs that mean
+        the same thing. This base version performs no transformation.
+        Returns:
+            The simplified node; here, always ``self``.
+        """
+        return self
+    def get_source_location(self) -> tuple[int, int] | None:
+        """Report where this node appears in the source.
+        Returns:
+            ``(line, position)`` read from the node's ``token`` attribute, or
+            None when the node has no ``token`` attribute.
+        """
+        # Nodes without a token carry no location information.
+        if not hasattr(self, "token"):
+            return None
+        tok = self.token
+        return (tok.line, tok.position)

machine_dialect/ast/call_expression.py ADDED Viewed

@@ -0,0 +1,82 @@
+"""CallExpression AST node for function calls that return values."""
+from __future__ import annotations
+from typing import TYPE_CHECKING
+from machine_dialect.ast.expressions import Expression
+if TYPE_CHECKING:
+    from machine_dialect.lexer import Token
+class CallExpression(Expression):
+    """Expression node for a function call whose result is used as a value.
+    It appears wherever an expression is expected, for example in an
+    assignment with 'using' or nested inside a larger expression. Standalone
+    calls that need not return anything are modelled by CallStatement instead.
+    Attributes:
+        function_name: Expression naming the function to call, or None.
+        arguments: Arguments node holding the call's arguments, or None.
+    """
+    def __init__(
+        self, token: Token, function_name: Expression | None = None, arguments: Expression | None = None
+    ) -> None:
+        """Create a call expression.
+        Args:
+            token: Token where the call starts (typically the function name).
+            function_name: Expression that identifies the callee.
+            arguments: Optional Arguments node with the call's arguments.
+        """
+        super().__init__(token)
+        self.function_name = function_name
+        self.arguments = arguments
+    def token_literal(self) -> str:
+        """Return the literal text of the token that starts the call.
+        Returns:
+            The token's literal value.
+        """
+        return self.token.literal
+    def __str__(self) -> str:
+        """Render the call as the function name followed by its arguments.
+        Returns:
+            The name (empty when missing) followed by the parenthesized
+            arguments, or ``()`` when there are none.
+        """
+        name_part = str(self.function_name) if self.function_name else ""
+        args_part = f"({self.arguments})" if self.arguments else "()"
+        return name_part + args_part
+    def desugar(self) -> CallExpression:
+        """Build a copy of this call with its parts desugared.
+        Returns:
+            A new CallExpression on the same token. A missing function name or
+            argument list stays None in the copy.
+        """
+        callee = self.function_name.desugar() if self.function_name else None
+        call_args = self.arguments.desugar() if self.arguments else None
+        return CallExpression(self.token, callee, call_args)

machine_dialect/ast/dict_extraction.py ADDED Viewed

@@ -0,0 +1,60 @@
+"""Dictionary extraction expressions for Machine Dialect™."""
+from __future__ import annotations
+from typing import TYPE_CHECKING
+from machine_dialect.ast.expressions import Expression
+if TYPE_CHECKING:
+    from machine_dialect.lexer.tokens import Token
+class DictExtraction(Expression):
+    """Expression that pulls the keys or the values out of a dictionary.
+    Covers source forms such as:
+    - the names of `person` (the keys)
+    - the contents of `person` (the values)
+    Attributes:
+        dictionary: Expression producing the dictionary to read from.
+        extract_type: 'names' to extract keys, 'contents' to extract values.
+        token: Token at which this expression starts.
+    """
+    def __init__(self, token: Token, dictionary: Expression, extract_type: str) -> None:
+        """Create a dictionary extraction expression.
+        Args:
+            token: Token at which this expression starts.
+            dictionary: Expression producing the dictionary to read from.
+            extract_type: Either 'names' or 'contents'.
+        """
+        super().__init__(token)
+        self.token = token
+        self.dictionary = dictionary
+        self.extract_type = extract_type
+    def __str__(self) -> str:
+        """Return the source-like phrase for this extraction."""
+        # Anything other than "names" is rendered as a contents extraction.
+        label = "names" if self.extract_type == "names" else "contents"
+        return f"the {label} of {self.dictionary}"
+    def desugar(self) -> DictExtraction:
+        """Return a copy whose dictionary operand has been desugared."""
+        source = self.dictionary
+        if hasattr(source, "desugar"):
+            source = source.desugar()
+        return DictExtraction(self.token, source, self.extract_type)
+    def to_hir(self) -> DictExtraction:
+        """Return a copy whose dictionary operand has been converted to HIR."""
+        source = self.dictionary
+        if hasattr(source, "to_hir"):
+            source = source.to_hir()
+        return DictExtraction(self.token, source, self.extract_type)