PyPI - machine-dialect - Versions diffs - 0.1.0a1__py3-none-any.whl - Mend

machine-dialect 0.1.0a1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (268) hide show

machine_dialect/__main__.py +667 -0
machine_dialect/agent/__init__.py +5 -0
machine_dialect/agent/agent.py +360 -0
machine_dialect/ast/__init__.py +95 -0
machine_dialect/ast/ast_node.py +35 -0
machine_dialect/ast/call_expression.py +82 -0
machine_dialect/ast/dict_extraction.py +60 -0
machine_dialect/ast/expressions.py +439 -0
machine_dialect/ast/literals.py +309 -0
machine_dialect/ast/program.py +35 -0
machine_dialect/ast/statements.py +1433 -0
machine_dialect/ast/tests/test_ast_string_representation.py +62 -0
machine_dialect/ast/tests/test_boolean_literal.py +29 -0
machine_dialect/ast/tests/test_collection_hir.py +138 -0
machine_dialect/ast/tests/test_define_statement.py +142 -0
machine_dialect/ast/tests/test_desugar.py +541 -0
machine_dialect/ast/tests/test_foreach_desugar.py +245 -0
machine_dialect/cfg/__init__.py +6 -0
machine_dialect/cfg/config.py +156 -0
machine_dialect/cfg/examples.py +221 -0
machine_dialect/cfg/generate_with_ai.py +187 -0
machine_dialect/cfg/openai_generation.py +200 -0
machine_dialect/cfg/parser.py +94 -0
machine_dialect/cfg/tests/__init__.py +1 -0
machine_dialect/cfg/tests/test_cfg_parser.py +252 -0
machine_dialect/cfg/tests/test_config.py +188 -0
machine_dialect/cfg/tests/test_examples.py +391 -0
machine_dialect/cfg/tests/test_generate_with_ai.py +354 -0
machine_dialect/cfg/tests/test_openai_generation.py +256 -0
machine_dialect/codegen/__init__.py +5 -0
machine_dialect/codegen/bytecode_module.py +89 -0
machine_dialect/codegen/bytecode_serializer.py +300 -0
machine_dialect/codegen/opcodes.py +101 -0
machine_dialect/codegen/register_codegen.py +1996 -0
machine_dialect/codegen/symtab.py +208 -0
machine_dialect/codegen/tests/__init__.py +1 -0
machine_dialect/codegen/tests/test_array_operations_codegen.py +295 -0
machine_dialect/codegen/tests/test_bytecode_serializer.py +185 -0
machine_dialect/codegen/tests/test_register_codegen_ssa.py +324 -0
machine_dialect/codegen/tests/test_symtab.py +418 -0
machine_dialect/codegen/vm_serializer.py +621 -0
machine_dialect/compiler/__init__.py +18 -0
machine_dialect/compiler/compiler.py +197 -0
machine_dialect/compiler/config.py +149 -0
machine_dialect/compiler/context.py +149 -0
machine_dialect/compiler/phases/__init__.py +19 -0
machine_dialect/compiler/phases/bytecode_optimization.py +90 -0
machine_dialect/compiler/phases/codegen.py +40 -0
machine_dialect/compiler/phases/hir_generation.py +39 -0
machine_dialect/compiler/phases/mir_generation.py +86 -0
machine_dialect/compiler/phases/optimization.py +110 -0
machine_dialect/compiler/phases/parsing.py +39 -0
machine_dialect/compiler/pipeline.py +143 -0
machine_dialect/compiler/tests/__init__.py +1 -0
machine_dialect/compiler/tests/test_compiler.py +568 -0
machine_dialect/compiler/vm_runner.py +173 -0
machine_dialect/errors/__init__.py +32 -0
machine_dialect/errors/exceptions.py +369 -0
machine_dialect/errors/messages.py +82 -0
machine_dialect/errors/tests/__init__.py +0 -0
machine_dialect/errors/tests/test_expected_token_errors.py +188 -0
machine_dialect/errors/tests/test_name_errors.py +118 -0
machine_dialect/helpers/__init__.py +0 -0
machine_dialect/helpers/stopwords.py +225 -0
machine_dialect/helpers/validators.py +30 -0
machine_dialect/lexer/__init__.py +9 -0
machine_dialect/lexer/constants.py +23 -0
machine_dialect/lexer/lexer.py +907 -0
machine_dialect/lexer/tests/__init__.py +0 -0
machine_dialect/lexer/tests/helpers.py +86 -0
machine_dialect/lexer/tests/test_apostrophe_identifiers.py +122 -0
machine_dialect/lexer/tests/test_backtick_identifiers.py +140 -0
machine_dialect/lexer/tests/test_boolean_literals.py +108 -0
machine_dialect/lexer/tests/test_case_insensitive_keywords.py +188 -0
machine_dialect/lexer/tests/test_comments.py +200 -0
machine_dialect/lexer/tests/test_double_asterisk_keywords.py +127 -0
machine_dialect/lexer/tests/test_lexer_position.py +113 -0
machine_dialect/lexer/tests/test_list_tokens.py +282 -0
machine_dialect/lexer/tests/test_stopwords.py +80 -0
machine_dialect/lexer/tests/test_strict_equality.py +129 -0
machine_dialect/lexer/tests/test_token.py +41 -0
machine_dialect/lexer/tests/test_tokenization.py +294 -0
machine_dialect/lexer/tests/test_underscore_literals.py +343 -0
machine_dialect/lexer/tests/test_url_literals.py +169 -0
machine_dialect/lexer/tokens.py +487 -0
machine_dialect/linter/__init__.py +10 -0
machine_dialect/linter/__main__.py +144 -0
machine_dialect/linter/linter.py +154 -0
machine_dialect/linter/rules/__init__.py +8 -0
machine_dialect/linter/rules/base.py +112 -0
machine_dialect/linter/rules/statement_termination.py +99 -0
machine_dialect/linter/tests/__init__.py +1 -0
machine_dialect/linter/tests/mdrules/__init__.py +0 -0
machine_dialect/linter/tests/mdrules/test_md101_statement_termination.py +181 -0
machine_dialect/linter/tests/test_linter.py +81 -0
machine_dialect/linter/tests/test_rules.py +110 -0
machine_dialect/linter/tests/test_violations.py +71 -0
machine_dialect/linter/violations.py +51 -0
machine_dialect/mir/__init__.py +69 -0
machine_dialect/mir/analyses/__init__.py +20 -0
machine_dialect/mir/analyses/alias_analysis.py +315 -0
machine_dialect/mir/analyses/dominance_analysis.py +49 -0
machine_dialect/mir/analyses/escape_analysis.py +286 -0
machine_dialect/mir/analyses/loop_analysis.py +272 -0
machine_dialect/mir/analyses/tests/test_type_analysis.py +736 -0
machine_dialect/mir/analyses/type_analysis.py +448 -0
machine_dialect/mir/analyses/use_def_chains.py +232 -0
machine_dialect/mir/basic_block.py +385 -0
machine_dialect/mir/dataflow.py +445 -0
machine_dialect/mir/debug_info.py +208 -0
machine_dialect/mir/hir_to_mir.py +1738 -0
machine_dialect/mir/mir_dumper.py +366 -0
machine_dialect/mir/mir_function.py +167 -0
machine_dialect/mir/mir_instructions.py +1877 -0
machine_dialect/mir/mir_interpreter.py +556 -0
machine_dialect/mir/mir_module.py +225 -0
machine_dialect/mir/mir_printer.py +480 -0
machine_dialect/mir/mir_transformer.py +410 -0
machine_dialect/mir/mir_types.py +367 -0
machine_dialect/mir/mir_validation.py +455 -0
machine_dialect/mir/mir_values.py +268 -0
machine_dialect/mir/optimization_config.py +233 -0
machine_dialect/mir/optimization_pass.py +251 -0
machine_dialect/mir/optimization_pipeline.py +355 -0
machine_dialect/mir/optimizations/__init__.py +84 -0
machine_dialect/mir/optimizations/algebraic_simplification.py +733 -0
machine_dialect/mir/optimizations/branch_prediction.py +372 -0
machine_dialect/mir/optimizations/constant_propagation.py +634 -0
machine_dialect/mir/optimizations/cse.py +398 -0
machine_dialect/mir/optimizations/dce.py +288 -0
machine_dialect/mir/optimizations/inlining.py +551 -0
machine_dialect/mir/optimizations/jump_threading.py +487 -0
machine_dialect/mir/optimizations/licm.py +405 -0
machine_dialect/mir/optimizations/loop_unrolling.py +366 -0
machine_dialect/mir/optimizations/strength_reduction.py +422 -0
machine_dialect/mir/optimizations/tail_call.py +207 -0
machine_dialect/mir/optimizations/tests/test_loop_unrolling.py +483 -0
machine_dialect/mir/optimizations/type_narrowing.py +397 -0
machine_dialect/mir/optimizations/type_specialization.py +447 -0
machine_dialect/mir/optimizations/type_specific.py +906 -0
machine_dialect/mir/optimize_mir.py +89 -0
machine_dialect/mir/pass_manager.py +391 -0
machine_dialect/mir/profiling/__init__.py +26 -0
machine_dialect/mir/profiling/profile_collector.py +318 -0
machine_dialect/mir/profiling/profile_data.py +372 -0
machine_dialect/mir/profiling/profile_reader.py +272 -0
machine_dialect/mir/profiling/profile_writer.py +226 -0
machine_dialect/mir/register_allocation.py +302 -0
machine_dialect/mir/reporting/__init__.py +17 -0
machine_dialect/mir/reporting/optimization_reporter.py +314 -0
machine_dialect/mir/reporting/report_formatter.py +289 -0
machine_dialect/mir/ssa_construction.py +342 -0
machine_dialect/mir/tests/__init__.py +1 -0
machine_dialect/mir/tests/test_algebraic_associativity.py +204 -0
machine_dialect/mir/tests/test_algebraic_complex_patterns.py +221 -0
machine_dialect/mir/tests/test_algebraic_division.py +126 -0
machine_dialect/mir/tests/test_algebraic_simplification.py +863 -0
machine_dialect/mir/tests/test_basic_block.py +425 -0
machine_dialect/mir/tests/test_branch_prediction.py +459 -0
machine_dialect/mir/tests/test_call_lowering.py +168 -0
machine_dialect/mir/tests/test_collection_lowering.py +604 -0
machine_dialect/mir/tests/test_cross_block_constant_propagation.py +255 -0
machine_dialect/mir/tests/test_custom_passes.py +166 -0
machine_dialect/mir/tests/test_debug_info.py +285 -0
machine_dialect/mir/tests/test_dict_extraction_lowering.py +192 -0
machine_dialect/mir/tests/test_dictionary_lowering.py +299 -0
machine_dialect/mir/tests/test_double_negation.py +231 -0
machine_dialect/mir/tests/test_escape_analysis.py +233 -0
machine_dialect/mir/tests/test_hir_to_mir.py +465 -0
machine_dialect/mir/tests/test_hir_to_mir_complete.py +389 -0
machine_dialect/mir/tests/test_hir_to_mir_simple.py +130 -0
machine_dialect/mir/tests/test_inlining.py +435 -0
machine_dialect/mir/tests/test_licm.py +472 -0
machine_dialect/mir/tests/test_mir_dumper.py +313 -0
machine_dialect/mir/tests/test_mir_instructions.py +445 -0
machine_dialect/mir/tests/test_mir_module.py +860 -0
machine_dialect/mir/tests/test_mir_printer.py +387 -0
machine_dialect/mir/tests/test_mir_types.py +123 -0
machine_dialect/mir/tests/test_mir_types_enhanced.py +132 -0
machine_dialect/mir/tests/test_mir_validation.py +378 -0
machine_dialect/mir/tests/test_mir_values.py +168 -0
machine_dialect/mir/tests/test_one_based_indexing.py +202 -0
machine_dialect/mir/tests/test_optimization_helpers.py +60 -0
machine_dialect/mir/tests/test_optimization_pipeline.py +554 -0
machine_dialect/mir/tests/test_optimization_reporter.py +318 -0
machine_dialect/mir/tests/test_pass_manager.py +294 -0
machine_dialect/mir/tests/test_pass_registration.py +64 -0
machine_dialect/mir/tests/test_profiling.py +356 -0
machine_dialect/mir/tests/test_register_allocation.py +307 -0
machine_dialect/mir/tests/test_report_formatters.py +372 -0
machine_dialect/mir/tests/test_ssa_construction.py +433 -0
machine_dialect/mir/tests/test_tail_call.py +236 -0
machine_dialect/mir/tests/test_type_annotated_instructions.py +192 -0
machine_dialect/mir/tests/test_type_narrowing.py +277 -0
machine_dialect/mir/tests/test_type_specialization.py +421 -0
machine_dialect/mir/tests/test_type_specific_optimization.py +545 -0
machine_dialect/mir/tests/test_type_specific_optimization_advanced.py +382 -0
machine_dialect/mir/type_inference.py +368 -0
machine_dialect/parser/__init__.py +12 -0
machine_dialect/parser/enums.py +45 -0
machine_dialect/parser/parser.py +3655 -0
machine_dialect/parser/protocols.py +11 -0
machine_dialect/parser/symbol_table.py +169 -0
machine_dialect/parser/tests/__init__.py +0 -0
machine_dialect/parser/tests/helper_functions.py +193 -0
machine_dialect/parser/tests/test_action_statements.py +334 -0
machine_dialect/parser/tests/test_boolean_literal_expressions.py +152 -0
machine_dialect/parser/tests/test_call_statements.py +154 -0
machine_dialect/parser/tests/test_call_statements_errors.py +187 -0
machine_dialect/parser/tests/test_collection_mutations.py +264 -0
machine_dialect/parser/tests/test_conditional_expressions.py +343 -0
machine_dialect/parser/tests/test_define_integration.py +468 -0
machine_dialect/parser/tests/test_define_statements.py +311 -0
machine_dialect/parser/tests/test_dict_extraction.py +115 -0
machine_dialect/parser/tests/test_empty_literal.py +155 -0
machine_dialect/parser/tests/test_float_literal_expressions.py +163 -0
machine_dialect/parser/tests/test_identifier_expressions.py +57 -0
machine_dialect/parser/tests/test_if_empty_block.py +61 -0
machine_dialect/parser/tests/test_if_statements.py +299 -0
machine_dialect/parser/tests/test_illegal_tokens.py +86 -0
machine_dialect/parser/tests/test_infix_expressions.py +680 -0
machine_dialect/parser/tests/test_integer_literal_expressions.py +137 -0
machine_dialect/parser/tests/test_interaction_statements.py +269 -0
machine_dialect/parser/tests/test_list_literals.py +277 -0
machine_dialect/parser/tests/test_no_none_in_ast.py +94 -0
machine_dialect/parser/tests/test_panic_mode_recovery.py +171 -0
machine_dialect/parser/tests/test_parse_errors.py +114 -0
machine_dialect/parser/tests/test_possessive_syntax.py +182 -0
machine_dialect/parser/tests/test_prefix_expressions.py +415 -0
machine_dialect/parser/tests/test_program.py +13 -0
machine_dialect/parser/tests/test_return_statements.py +89 -0
machine_dialect/parser/tests/test_set_statements.py +152 -0
machine_dialect/parser/tests/test_strict_equality.py +258 -0
machine_dialect/parser/tests/test_symbol_table.py +217 -0
machine_dialect/parser/tests/test_url_literal_expressions.py +209 -0
machine_dialect/parser/tests/test_utility_statements.py +423 -0
machine_dialect/parser/token_buffer.py +159 -0
machine_dialect/repl/__init__.py +3 -0
machine_dialect/repl/repl.py +426 -0
machine_dialect/repl/tests/__init__.py +0 -0
machine_dialect/repl/tests/test_repl.py +606 -0
machine_dialect/semantic/__init__.py +12 -0
machine_dialect/semantic/analyzer.py +906 -0
machine_dialect/semantic/error_messages.py +189 -0
machine_dialect/semantic/tests/__init__.py +1 -0
machine_dialect/semantic/tests/test_analyzer.py +364 -0
machine_dialect/semantic/tests/test_error_messages.py +104 -0
machine_dialect/tests/edge_cases/__init__.py +10 -0
machine_dialect/tests/edge_cases/test_boundary_access.py +256 -0
machine_dialect/tests/edge_cases/test_empty_collections.py +166 -0
machine_dialect/tests/edge_cases/test_invalid_operations.py +243 -0
machine_dialect/tests/edge_cases/test_named_list_edge_cases.py +295 -0
machine_dialect/tests/edge_cases/test_nested_structures.py +313 -0
machine_dialect/tests/edge_cases/test_type_mixing.py +277 -0
machine_dialect/tests/integration/test_array_operations_emulation.py +248 -0
machine_dialect/tests/integration/test_list_compilation.py +395 -0
machine_dialect/tests/integration/test_lists_and_dictionaries.py +322 -0
machine_dialect/type_checking/__init__.py +21 -0
machine_dialect/type_checking/tests/__init__.py +1 -0
machine_dialect/type_checking/tests/test_type_system.py +230 -0
machine_dialect/type_checking/type_system.py +270 -0
machine_dialect-0.1.0a1.dist-info/METADATA +128 -0
machine_dialect-0.1.0a1.dist-info/RECORD +268 -0
machine_dialect-0.1.0a1.dist-info/WHEEL +5 -0
machine_dialect-0.1.0a1.dist-info/entry_points.txt +3 -0
machine_dialect-0.1.0a1.dist-info/licenses/LICENSE +201 -0
machine_dialect-0.1.0a1.dist-info/top_level.txt +2 -0
machine_dialect_vm/__init__.pyi +15 -0

machine_dialect/cfg/tests/test_generate_with_ai.py ADDED Viewed

@@ -0,0 +1,354 @@
+"""Tests for the AI-based Machine Dialect™ code generation module."""
+from unittest.mock import MagicMock, Mock, mock_open, patch
+import pytest
+from machine_dialect.cfg.generate_with_ai import generate_code, main
+class TestGenerateCode:
+    """Test the generate_code function."""
+    @patch("machine_dialect.cfg.generate_with_ai.ConfigLoader")
+    @patch("machine_dialect.cfg.generate_with_ai.CFGParser")
+    def test_generate_code_with_valid_config(self, mock_parser_class: Mock, mock_loader_class: Mock) -> None:
+        """Test successful code generation with valid configuration."""
+        # Setup mocks
+        mock_loader = mock_loader_class.return_value
+        mock_config = MagicMock()
+        mock_config.key = "test-api-key"
+        mock_config.model = "gpt-3.5-turbo"
+        mock_loader.load.return_value = mock_config
+        mock_parser = mock_parser_class.return_value
+        mock_parser.validate.return_value = True
+        # Call function
+        result = generate_code(
+            task="calculate area",
+            temperature=0.5,
+            max_tokens=300,
+            validate=True,
+        )
+        # Verify result contains example code
+        assert "Set `width` to" in result
+        assert "Set `height` to" in result
+        assert "Set `area` to" in result
+        # Verify mocks were called
+        mock_loader.load.assert_called_once()
+        mock_parser.validate.assert_called_once()
+    @patch("machine_dialect.cfg.generate_with_ai.ConfigLoader")
+    @patch("machine_dialect.cfg.generate_with_ai.CFGParser")
+    def test_generate_code_with_api_key_override(self, mock_parser_class: Mock, mock_loader_class: Mock) -> None:
+        """Test that API key parameter overrides config."""
+        # Setup mocks
+        mock_loader = mock_loader_class.return_value
+        mock_config = MagicMock()
+        mock_config.key = "config-api-key"
+        mock_config.model = "gpt-3.5-turbo"
+        mock_loader.load.return_value = mock_config
+        mock_parser = mock_parser_class.return_value
+        mock_parser.validate.return_value = True
+        # Call with API key override
+        result = generate_code(
+            task="test task",
+            api_key="override-api-key",
+            validate=True,
+        )
+        # Verify the config was overridden
+        assert mock_config.key == "override-api-key"
+        assert result is not None
+    @patch("machine_dialect.cfg.generate_with_ai.ConfigLoader")
+    @patch("machine_dialect.cfg.generate_with_ai.CFGParser")
+    def test_generate_code_with_model_override(self, mock_parser_class: Mock, mock_loader_class: Mock) -> None:
+        """Test that model parameter overrides config."""
+        # Setup mocks
+        mock_loader = mock_loader_class.return_value
+        mock_config = MagicMock()
+        mock_config.key = "test-api-key"
+        mock_config.model = "gpt-3.5-turbo"
+        mock_loader.load.return_value = mock_config
+        mock_parser = mock_parser_class.return_value
+        mock_parser.validate.return_value = True
+        # Call with model override
+        result = generate_code(
+            task="test task",
+            model="gpt-4",
+            validate=True,
+        )
+        # Verify the config was overridden
+        assert mock_config.model == "gpt-4"
+        assert result is not None
+    @patch("machine_dialect.cfg.generate_with_ai.ConfigLoader")
+    def test_generate_code_missing_api_key(self, mock_loader_class: Mock) -> None:
+        """Test error when API key is not configured."""
+        # Setup mocks - no API key
+        mock_loader = mock_loader_class.return_value
+        mock_config = MagicMock()
+        mock_config.key = None
+        mock_config.model = "gpt-3.5-turbo"
+        mock_loader.load.return_value = mock_config
+        mock_loader.get_error_message.return_value = "Please configure API key"
+        # Should raise ValueError
+        with pytest.raises(ValueError, match="Please configure API key"):
+            generate_code(task="test task")
+    @patch("machine_dialect.cfg.generate_with_ai.ConfigLoader")
+    def test_generate_code_missing_model(self, mock_loader_class: Mock) -> None:
+        """Test error when model is not configured."""
+        # Setup mocks - no model
+        mock_loader = mock_loader_class.return_value
+        mock_config = MagicMock()
+        mock_config.key = "test-api-key"
+        mock_config.model = None
+        mock_loader.load.return_value = mock_config
+        mock_loader.get_error_message.return_value = "Please configure model"
+        # Should raise ValueError
+        with pytest.raises(ValueError, match="No AI model configured"):
+            generate_code(task="test task")
+    @patch("machine_dialect.cfg.generate_with_ai.ConfigLoader")
+    @patch("machine_dialect.cfg.generate_with_ai.CFGParser")
+    @patch("builtins.print")
+    def test_generate_code_without_validation(
+        self, mock_print: Mock, mock_parser_class: Mock, mock_loader_class: Mock
+    ) -> None:
+        """Test code generation without validation."""
+        # Setup mocks
+        mock_loader = mock_loader_class.return_value
+        mock_config = MagicMock()
+        mock_config.key = "test-api-key"
+        mock_config.model = "gpt-3.5-turbo"
+        mock_loader.load.return_value = mock_config
+        mock_parser = mock_parser_class.return_value
+        # Call without validation
+        result = generate_code(
+            task="test task",
+            validate=False,
+        )
+        # Verify parser was not instantiated/called
+        mock_parser.validate.assert_not_called()
+        assert result is not None
+    @patch("machine_dialect.cfg.generate_with_ai.ConfigLoader")
+    @patch("machine_dialect.cfg.generate_with_ai.CFGParser")
+    @patch("builtins.print")
+    def test_generate_code_with_invalid_syntax(
+        self, mock_print: Mock, mock_parser_class: Mock, mock_loader_class: Mock
+    ) -> None:
+        """Test code generation when validation fails."""
+        # Setup mocks
+        mock_loader = mock_loader_class.return_value
+        mock_config = MagicMock()
+        mock_config.key = "test-api-key"
+        mock_config.model = "gpt-3.5-turbo"
+        mock_loader.load.return_value = mock_config
+        mock_parser = mock_parser_class.return_value
+        mock_parser.validate.return_value = False
+        # Call with validation
+        result = generate_code(
+            task="test task",
+            validate=True,
+        )
+        # Verify validation was attempted and failed message printed
+        mock_parser.validate.assert_called_once()
+        # Check that error message was printed
+        print_calls = [str(call) for call in mock_print.call_args_list]
+        assert any("✗ Generated code has syntax errors" in str(call) for call in print_calls)
+        assert result is not None
+    @patch("machine_dialect.cfg.generate_with_ai.ConfigLoader")
+    @patch("machine_dialect.cfg.generate_with_ai.CFGParser")
+    @patch("builtins.print")
+    def test_generate_code_temperature_and_tokens(
+        self, mock_print: Mock, mock_parser_class: Mock, mock_loader_class: Mock
+    ) -> None:
+        """Test that temperature and max_tokens parameters are used."""
+        # Setup mocks
+        mock_loader = mock_loader_class.return_value
+        mock_config = MagicMock()
+        mock_config.key = "test-api-key"
+        mock_config.model = "gpt-4"
+        mock_loader.load.return_value = mock_config
+        mock_parser = mock_parser_class.return_value
+        mock_parser.validate.return_value = True
+        # Call with custom temperature and tokens
+        result = generate_code(
+            task="complex task",
+            temperature=0.2,
+            max_tokens=1000,
+            validate=True,
+        )
+        # Verify parameters were printed
+        print_calls = [str(call) for call in mock_print.call_args_list]
+        assert any("Temperature: 0.2" in str(call) for call in print_calls)
+        assert any("Max tokens: 1000" in str(call) for call in print_calls)
+        assert result is not None
+class TestMain:
+    """Test the main function."""
+    @patch("sys.argv", ["prog", "calculate area"])
+    @patch("machine_dialect.cfg.generate_with_ai.generate_code")
+    def test_main_basic_task(self, mock_generate: Mock) -> None:
+        """Test main with basic task argument."""
+        mock_generate.return_value = "Generated code"
+        result = main()
+        assert result == 0
+        mock_generate.assert_called_once_with(
+            task="calculate area",
+            api_key=None,
+            model=None,
+            temperature=0.7,
+            max_tokens=500,
+            validate=True,
+        )
+    @patch("sys.argv", ["prog", "test task", "--api-key", "my-key", "--model", "gpt-4"])
+    @patch("machine_dialect.cfg.generate_with_ai.generate_code")
+    def test_main_with_overrides(self, mock_generate: Mock) -> None:
+        """Test main with API key and model overrides."""
+        mock_generate.return_value = "Generated code"
+        result = main()
+        assert result == 0
+        mock_generate.assert_called_once_with(
+            task="test task",
+            api_key="my-key",
+            model="gpt-4",
+            temperature=0.7,
+            max_tokens=500,
+            validate=True,
+        )
+    @patch("sys.argv", ["prog", "test task", "--temperature", "0.3", "--max-tokens", "1000"])
+    @patch("machine_dialect.cfg.generate_with_ai.generate_code")
+    def test_main_with_generation_params(self, mock_generate: Mock) -> None:
+        """Test main with temperature and max-tokens parameters."""
+        mock_generate.return_value = "Generated code"
+        result = main()
+        assert result == 0
+        mock_generate.assert_called_once_with(
+            task="test task",
+            api_key=None,
+            model=None,
+            temperature=0.3,
+            max_tokens=1000,
+            validate=True,
+        )
+    @patch("sys.argv", ["prog", "test task", "--no-validate"])
+    @patch("machine_dialect.cfg.generate_with_ai.generate_code")
+    def test_main_without_validation(self, mock_generate: Mock) -> None:
+        """Test main with --no-validate flag."""
+        mock_generate.return_value = "Generated code"
+        result = main()
+        assert result == 0
+        mock_generate.assert_called_once_with(
+            task="test task",
+            api_key=None,
+            model=None,
+            temperature=0.7,
+            max_tokens=500,
+            validate=False,
+        )
+    @patch("sys.argv", ["prog", "test task", "--save", "output.md"])
+    @patch("machine_dialect.cfg.generate_with_ai.generate_code")
+    @patch("builtins.open", new_callable=mock_open)
+    @patch("builtins.print")
+    def test_main_with_save_file(self, mock_print: Mock, mock_file: Mock, mock_generate: Mock) -> None:
+        """Test main with --save option to write to file."""
+        mock_generate.return_value = "Generated code content"
+        result = main()
+        assert result == 0
+        mock_generate.assert_called_once()
+        # Verify file was written
+        mock_file.assert_called_once_with("output.md", "w")
+        mock_file().write.assert_called_once_with("Generated code content")
+        # Verify success message was printed
+        print_calls = [str(call) for call in mock_print.call_args_list]
+        assert any("Code saved to: output.md" in str(call) for call in print_calls)
+    @patch("sys.argv", ["prog", "test task"])
+    @patch("machine_dialect.cfg.generate_with_ai.generate_code")
+    @patch("builtins.print")
+    def test_main_with_exception(self, mock_print: Mock, mock_generate: Mock) -> None:
+        """Test main when generate_code raises an exception."""
+        mock_generate.side_effect = ValueError("API key not configured")
+        result = main()
+        assert result == 1
+        mock_generate.assert_called_once()
+        # Verify error message was printed
+        print_calls = [str(call) for call in mock_print.call_args_list]
+        assert any("Error: API key not configured" in str(call) for call in print_calls)
+    @patch("sys.argv", ["prog", "complex task", "--save", "/invalid/path/file.md"])
+    @patch("machine_dialect.cfg.generate_with_ai.generate_code")
+    @patch("builtins.open", side_effect=OSError("Permission denied"))
+    @patch("builtins.print")
+    def test_main_with_save_error(self, mock_print: Mock, mock_file: Mock, mock_generate: Mock) -> None:
+        """Test main when saving to file fails."""
+        mock_generate.return_value = "Generated code"
+        result = main()
+        assert result == 1
+        mock_generate.assert_called_once()
+        # Verify error message was printed
+        print_calls = [str(call) for call in mock_print.call_args_list]
+        assert any("Error: Permission denied" in str(call) for call in print_calls)
+    def test_main_as_script(self) -> None:
+        """Test that main can be called as a script."""
+        with patch("sys.argv", ["prog", "test"]):
+            with patch("machine_dialect.cfg.generate_with_ai.generate_code") as mock_gen:
+                mock_gen.return_value = "code"
+                # Import and run the module as __main__
+                import machine_dialect.cfg.generate_with_ai as module
+                # Simulate running as script
+                with patch.object(module, "__name__", "__main__"):
+                    # This would normally trigger the if __name__ == "__main__" block
+                    # but we'll call main directly for testing
+                    exit_code = module.main()
+                    assert exit_code == 0

machine_dialect/cfg/tests/test_openai_generation.py ADDED Viewed

@@ -0,0 +1,256 @@
+"""Tests for the grammar-based OpenAI generation module."""
+from unittest.mock import MagicMock
+import pytest
+from machine_dialect.cfg.openai_generation import _get_machine_dialect_cfg, generate_with_openai, validate_model_support
+class TestGenerateWithOpenAI:
+    """Tests for generate_with_openai() driven by a mocked OpenAI client."""
+    @staticmethod
+    def _client_returning(code: str) -> MagicMock:
+        """Build a mock client whose responses.create() returns a response carrying *code*.
+        The text is exposed both as ``output_text`` and as the ``input`` of the
+        second ``output`` item, mirroring the primary and fallback paths the tests set up.
+        """
+        tool_output = MagicMock()
+        tool_output.input = code
+        response = MagicMock()
+        response.output_text = code
+        response.output = [MagicMock(), tool_output]  # First is text, second is tool output
+        client = MagicMock()
+        client.responses.create.return_value = response
+        return client
+    def test_gpt5_cfg_generation(self) -> None:
+        """Generate with gpt-5 and inspect both the result and the request sent to the API."""
+        expected_code = "Set x to _10_.\nGive back x."
+        mock_client = self._client_returning(expected_code)
+        result = generate_with_openai(
+            client=mock_client,
+            model="gpt-5",
+            task_description="set x to 10 and display it",
+            max_tokens=200,
+            temperature=0.7,
+        )
+        # The call hands back a (code, token_info) pair
+        assert isinstance(result, tuple)
+        assert len(result) == 2
+        code, token_info = result
+        assert code == expected_code
+        assert isinstance(token_info, dict)
+        # Keyword arguments of the single responses.create() call
+        request = mock_client.responses.create.call_args.kwargs
+        assert request["model"] == "gpt-5"
+        # Note: GPT-5 doesn't support max_completion_tokens or temperature
+        for unsupported in ("max_completion_tokens", "temperature"):
+            assert unsupported not in request
+        assert request["parallel_tool_calls"] is False
+        # Exactly one custom tool, and it carries the grammar format
+        tools = request["tools"]
+        assert len(tools) == 1
+        tool = tools[0]
+        assert tool["type"] == "custom"
+        assert tool["name"] == "machine_dialect_generator"
+        assert "format" in tool
+        # The format is a Lark grammar whose definition is a plain string
+        grammar_format = tool["format"]
+        assert grammar_format["type"] == "grammar"
+        assert grammar_format["syntax"] == "lark"
+        assert "definition" in grammar_format
+        definition = grammar_format["definition"]
+        assert isinstance(definition, str)
+        for rule in ("start:", "statement:"):
+            assert rule in definition
+    def test_non_gpt5_model_raises_error(self) -> None:
+        """A gpt-4o request raises ValueError and never reaches responses.create()."""
+        mock_client = MagicMock()
+        with pytest.raises(ValueError, match="does not support context-free grammar"):
+            generate_with_openai(
+                client=mock_client,
+                model="gpt-4o",
+                task_description="test task",
+                max_tokens=100,
+            )
+        # No request may have been issued
+        mock_client.responses.create.assert_not_called()
+    def test_gpt5_mini_supported(self) -> None:
+        """gpt-5-mini goes through to the API and yields the mocked code."""
+        expected_code = 'Give back _"Hello"_.'
+        mock_client = self._client_returning(expected_code)
+        result = generate_with_openai(
+            client=mock_client,
+            model="gpt-5-mini",
+            task_description="say hello",
+            max_tokens=50,
+        )
+        # Same (code, token_info) shape as for gpt-5
+        assert isinstance(result, tuple)
+        assert len(result) == 2
+        code, token_info = result
+        assert code == expected_code
+        assert isinstance(token_info, dict)
+        assert mock_client.responses.create.called
+    def test_empty_response_raises_error(self) -> None:
+        """A response with output_text=None and an empty output list raises ValueError."""
+        # Neither the primary text nor the fallback output holds anything usable
+        mock_response = MagicMock(output_text=None, output=[])
+        mock_client = MagicMock()
+        mock_client.responses.create.return_value = mock_response
+        with pytest.raises(ValueError, match="Failed to extract valid code"):
+            generate_with_openai(client=mock_client, model="gpt-5", task_description="test task", max_tokens=100)
+    def test_empty_code_raises_error(self) -> None:
+        """An empty output_text on a response without an output attribute raises ValueError."""
+        mock_response = MagicMock(output_text="")
+        # Deleting the attribute makes later access raise AttributeError on the mock
+        del mock_response.output
+        mock_client = MagicMock()
+        mock_client.responses.create.return_value = mock_response
+        with pytest.raises(ValueError, match="Failed to extract valid code"):
+            generate_with_openai(client=mock_client, model="gpt-5", task_description="test task", max_tokens=100)
+    def test_input_messages_structure(self) -> None:
+        """The request's input holds a developer message followed by the user message."""
+        mock_client = self._client_returning("test")
+        result = generate_with_openai(
+            client=mock_client,
+            model="gpt-5-nano",
+            task_description="test task",
+            max_tokens=50,
+        )
+        assert isinstance(result, tuple)  # Verify it returns a tuple
+        # Messages handed to responses.create() through the "input" keyword
+        messages = mock_client.responses.create.call_args.kwargs["input"]
+        assert len(messages) == 2
+        developer_msg, user_msg = messages[0], messages[1]
+        # Developer message
+        assert developer_msg["role"] == "developer"
+        for phrase in ("Machine Dialect™ code generator", "context-free grammar"):
+            assert phrase in developer_msg["content"]
+        # User message
+        assert user_msg["role"] == "user"
+        assert "test task" in user_msg["content"]
+class TestValidateModelSupport:
+    """Tests for validate_model_support() across supported and unsupported model names."""
+    def test_gpt5_models_supported(self) -> None:
+        """GPT-5 family names are accepted in lower, upper and mixed case."""
+        for model in ("gpt-5", "GPT-5", "gpt-5-mini", "GPT-5-MINI", "gpt-5-nano", "gpt-5-Nano"):
+            assert validate_model_support(model) is True
+    def test_non_gpt5_models_not_supported(self) -> None:
+        """Names without "gpt-5" in them are rejected."""
+        for model in ("gpt-4", "gpt-4o", "gpt-3.5-turbo", "claude-3", "gemini-pro"):
+            assert validate_model_support(model) is False
+    def test_partial_matches(self) -> None:
+        """Names that merely contain "gpt-5" (dated, suffixed or prefixed) are accepted."""
+        for model in ("gpt-5-2025-08-07", "gpt-5-mini-latest", "custom-gpt-5-model"):
+            assert validate_model_support(model) is True
+class TestMachineDialectCFG:
+    """Tests for the dictionary returned by _get_machine_dialect_cfg()."""
+    def test_cfg_structure(self) -> None:
+        """The CFG is a Lark grammar dict whose definition names the key rules."""
+        cfg = _get_machine_dialect_cfg()
+        # Top-level keys
+        assert cfg["type"] == "grammar"
+        assert cfg["syntax"] == "lark"  # Now using Lark syntax
+        assert "definition" in cfg
+        # The definition itself is the grammar text
+        definition = cfg["definition"]
+        assert isinstance(definition, str)
+        # Either entry-rule spelling is accepted
+        assert any(entry in definition for entry in ("start:", "program:"))
+        for rule in ("statement:", "set_stmt:", "give_back_stmt:", "if_stmt:", "expression:"):
+            assert rule in definition
+        # Terminals (literal patterns and identifiers)
+        assert any(marker in definition for marker in ("LITERAL_", "IDENT"))
+        assert "IDENTIFIER" in definition
+    def test_lark_grammar_content(self) -> None:
+        """Look for the statement, expression and operator pieces inside the grammar text."""
+        grammar = _get_machine_dialect_cfg()["definition"]
+        # Entry point and statement rules
+        assert any(entry in grammar for entry in ("program:", "start:"))
+        for fragment in ("statement:", "set_stmt", "give_back_stmt"):
+            assert fragment in grammar
+        # Exact rule text for the set and give-back statements
+        assert 'set_stmt: "Set"i identifier "to"i expression' in grammar
+        assert 'give_back_stmt: ("Give"i "back"i | "Gives"i "back"i) expression' in grammar
+        # Expression rule plus the logical keywords, looked up case-insensitively
+        assert any(rule in grammar for rule in ("expression:", "expr:"))
+        lowered = grammar.lower()
+        for keyword in ("or", "and"):
+            assert keyword in lowered
+        # Comparison operators
+        for comparison in ('"<"', '">"'):
+            assert comparison in grammar
+        assert '"equals"i' in grammar or "equals" in lowered
+        # Arithmetic operators
+        for operator in ('"+"', '"-"', '"*"', '"/"'):
+            assert operator in grammar
+    def test_grammar_terminals(self) -> None:
+        """The grammar names its terminals and imports/ignores common whitespace."""
+        grammar = _get_machine_dialect_cfg()["definition"]
+        # Terminal definitions (new pattern with literals)
+        assert any(name in grammar for name in ("IDENTIFIER", "IDENT"))
+        assert "LITERAL_" in grammar  # Check for literal patterns
+        # Whitespace handling directives
+        for directive in ("%import common.WS", "%ignore WS"):
+            assert directive in grammar

machine_dialect/codegen/__init__.py ADDED Viewed

@@ -0,0 +1,5 @@
+"""Bytecode generation for Machine Dialect™."""
+from .bytecode_serializer import BytecodeWriter
+__all__ = ["BytecodeWriter"]