PyPI - janus-llm - Versions diffs - 4.3.5__py3-none-any.whl → 4.4.5__py3-none-any.whl - Mend

janus-llm 4.3.5py3-none-any.whl → 4.4.5py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (30) hide show

janus/__init__.py +1 -1
janus/cli/aggregate.py +2 -2
janus/cli/cli.py +6 -0
janus/cli/constants.py +6 -0
janus/cli/diagram.py +36 -7
janus/cli/document.py +10 -1
janus/cli/llm.py +7 -3
janus/cli/partition.py +10 -1
janus/cli/pipeline.py +123 -0
janus/cli/self_eval.py +1 -3
janus/cli/translate.py +10 -1
janus/converter/_tests/test_translate.py +5 -5
janus/converter/chain.py +180 -0
janus/converter/converter.py +333 -78
janus/converter/diagram.py +8 -6
janus/converter/document.py +7 -3
janus/converter/evaluate.py +140 -148
janus/converter/partition.py +2 -10
janus/converter/requirements.py +4 -40
janus/converter/translate.py +2 -58
janus/language/block.py +31 -2
janus/metrics/metric.py +47 -124
janus/parsers/reqs_parser.py +3 -3
{janus_llm-4.3.5.dist-info → janus_llm-4.4.5.dist-info}/METADATA +12 -12
{janus_llm-4.3.5.dist-info → janus_llm-4.4.5.dist-info}/RECORD +28 -28
janus/metrics/_tests/test_llm.py +0 -90
janus/metrics/llm_metrics.py +0 -202
{janus_llm-4.3.5.dist-info → janus_llm-4.4.5.dist-info}/LICENSE +0 -0
{janus_llm-4.3.5.dist-info → janus_llm-4.4.5.dist-info}/WHEEL +0 -0
{janus_llm-4.3.5.dist-info → janus_llm-4.4.5.dist-info}/entry_points.txt +0 -0

janus/converter/document.py CHANGED Viewed

@@ -19,7 +19,7 @@ class Documenter(Converter):
     ):
         kwargs.update(source_language=source_language)
         super().__init__(**kwargs)
-        self.set_prompt("document")
+        self.set_prompts("document")
         if drop_comments:
             comment_node_type = LANGUAGES[source_language].get(
@@ -33,10 +33,12 @@ class Documenter(Converter):
 class MultiDocumenter(Documenter):
     def __init__(self, **kwargs):
         super().__init__(**kwargs)
-        self.set_prompt("multidocument")
+        self.set_prompts("multidocument")
         self._combiner = JsonCombiner()
         self._parser = MultiDocumentationParser()
+        self._load_parameters()
 class ClozeDocumenter(Documenter):
     def __init__(
@@ -46,12 +48,14 @@ class ClozeDocumenter(Documenter):
     ) -> None:
         kwargs.update(drop_comments=False)
         super().__init__(**kwargs)
-        self.set_prompt("document_cloze")
+        self.set_prompts("document_cloze")
         self._combiner = JsonCombiner()
         self._parser = ClozeDocumentationParser()
         self.comments_per_request = comments_per_request
+        self._load_parameters()
     def _add_translation(self, block: TranslatedCodeBlock):
         if block.translated:
             return

janus/converter/evaluate.py CHANGED Viewed

@@ -1,15 +1,15 @@
 import json
 import re
 from copy import deepcopy
+from pathlib import Path
+from typing import Any
 from langchain_core.runnables import Runnable, RunnableLambda, RunnableParallel
 from janus.converter.converter import Converter
-from janus.language.block import TranslatedCodeBlock
 from janus.language.combine import JsonCombiner
 from janus.parsers.eval_parsers.incose_parser import IncoseParser
 from janus.parsers.eval_parsers.inline_comment_parser import InlineCommentParser
-from janus.parsers.parser import JanusParserException
 from janus.utils.logger import create_logger
 log = create_logger(__name__)
@@ -35,6 +35,7 @@ class Evaluator(Converter):
             model_arguments: Additional arguments to pass to the LLM constructor.
             max_prompts: The maximum number of prompts to try before giving up.
         """
+        kwargs.update(use_janus_inputs=True)
         super().__init__(**kwargs)
         self._combiner = JsonCombiner()
         self._load_parameters()
@@ -62,7 +63,7 @@ class RequirementEvaluator(Evaluator):
         super().__init__(**kwargs)
         self.eval_items_per_request = eval_items_per_request
         self._parser = IncoseParser()
-        self.set_prompt("eval_prompts/incose")
+        self.set_prompts("eval_prompts/incose")
     def _input_runnable(self) -> Runnable:
         def _get_code(json_text: str) -> str:
@@ -77,76 +78,55 @@ class RequirementEvaluator(Evaluator):
             context=self._retriever,
         )
-    def _add_translation(self, block: TranslatedCodeBlock):
-        if block.translated:
-            return
-        if block.original.text is None:
-            block.translated = True
-            return
-        if self.eval_items_per_request is None:
-            return super()._add_translation(block)
-        input_obj = json.loads(block.original.text)
-        requirements = input_obj.get("requirements", [])
-        if not requirements:
-            log.debug(f"[{block.name}] Skipping empty block")
-            block.translated = True
-            block.text = None
-            block.complete = True
-            return
-        # For some reason requirements objects are in nested lists?
-        while isinstance(requirements[0], list):
-            requirements = [r for lst in requirements for r in lst]
-        if len(requirements) <= self.eval_items_per_request:
-            input_obj["requirements"] = requirements
-            block.original.text = json.dumps(input_obj)
-            return super()._add_translation(block)
-        block.processing_time = 0
-        block.cost = 0
-        obj = {}
-        for i in range(0, len(requirements), self.eval_items_per_request):
-            # Build a new TranslatedBlock using the new working text
-            working_requirements = requirements[i : i + self.eval_items_per_request]
-            working_copy = deepcopy(block.original)
-            working_obj = json.loads(working_copy.text)  # type: ignore
-            working_obj["requirements"] = working_requirements
-            working_copy.text = json.dumps(working_obj)
-            working_block = TranslatedCodeBlock(working_copy, self._target_language)
-            # Run the LLM on the working text
-            try:
-                super()._add_translation(working_block)
-            except JanusParserException as e:
-                block.text += "\n==============\n" + working_block.text
-                block.tokens = self._llm.get_num_tokens(block.text)
-                raise e
-            finally:
-                # Update metadata to include for all runs
-                block.num_requests += working_block.num_requests
-                block.cost += working_block.cost
-                block.processing_time += working_block.processing_time
-                block.request_input_tokens += working_block.request_input_tokens
-                block.request_output_tokens += working_block.request_output_tokens
-            # Update the output text to merge this section's output in
-            obj.update(json.loads(working_block.text))
-            # intermediate result of block,
-            # will be overwritten if file completes successfully
-            block.text = json.dumps(obj)
-        block.text = json.dumps(obj)
-        block.tokens = self._llm.get_num_tokens(block.text)
-        block.translated = True
-        log.debug(
-            f"[{block.name}] Output code:\n{json.dumps(json.loads(block.text), indent=2)}"
-        )
+    def translate_janus_obj(self, obj: Any, name: str, failure_path: Path | None = None):
+        results = []
+        for o in obj["outputs"]:
+            if isinstance(o, dict):
+                results += self.translate_janus_obj(o, name, failure_path)
+            elif isinstance(o, str):
+                temp_obj = deepcopy(obj)
+                requirements = json.loads(o)
+                if not requirements:
+                    log.debug(f"[{name}] Skipping empty output")
+                    continue
+                if (
+                    not self.eval_items_per_request
+                    or len(requirements) < self.eval_items_per_request
+                ):
+                    obj_str = json.dumps(
+                        dict(
+                            requirements=requirements,
+                            code=obj["input"],
+                        )
+                    )
+                    temp_obj["outputs"] = [obj_str]
+                    temp_block = self._janus_object_to_codeblock(temp_obj, name)
+                    translated_block = self.translate_block(temp_block, failure_path)
+                    translated_block.previous_generations[-1] = obj
+                    translated_block.original = self._janus_object_to_codeblock(obj, name)
+                    results.append(translated_block)
+                else:
+                    for i in range(0, len(requirements), self.eval_items_per_request):
+                        working_requirements = requirements[
+                            i : i + self.eval_items_per_request
+                        ]
+                        obj_str = json.dumps(
+                            dict(
+                                requirements=working_requirements,
+                                code=obj["input"],
+                            )
+                        )
+                        temp_obj["outputs"] = [obj_str]
+                        temp_block = self._janus_object_to_codeblock(temp_obj, name)
+                        translated_block = self.translate_block(temp_block, failure_path)
+                        translated_block.previous_generations[-1] = obj
+                        translated_block.original = self._janus_object_to_codeblock(
+                            obj, name
+                        )
+                        results.append(translated_block)
+            else:
+                raise ValueError(f"Error: unable to find janus object: {type(o)}")
+        return results
 class InlineCommentEvaluator(Evaluator):
@@ -167,82 +147,94 @@ class InlineCommentEvaluator(Evaluator):
         """
         super().__init__(**kwargs)
         self._combiner = JsonCombiner()
-        self._load_parameters()
         self._parser = InlineCommentParser()
-        self.set_prompt("eval_prompts/inline_comments")
+        self.set_prompts("eval_prompts/inline_comments")
         self.eval_items_per_request = eval_items_per_request
+        self._load_parameters()
-    def _add_translation(self, block: TranslatedCodeBlock):
-        if block.translated:
-            return
-        if block.original.text is None:
-            block.translated = True
-            return
-        if self.eval_items_per_request is None:
-            return super()._add_translation(block)
+    def _process_comments(self, input_str: str, generated_comments: dict[str, str]):
+        comment_patterns = [
+            (r"<BLOCK_COMMENT (\w{8})>", "<BLOCK_COMMENT {}>", "<BLOCK_COMMENT {}>"),
+            (r"<INLINE_COMMENT (\w{8})>", "<INLINE_COMMENT {}>", "<INLINE_COMMENT {}>"),
+            (r"<MODULE (\w{8})>", "<MODULE {}>", "<BLOCK_COMMENT {}>"),
+        ]
+        missing_comments = 0
+        for pattern, find_template, repl_template in comment_patterns:
+            matches = re.findall(pattern, input_str)
+            for comment_id in matches:
+                find_tag = find_template.format(comment_id)
+                repl_tag = repl_template.format(comment_id)
+                if comment_id not in generated_comments:
+                    missing_comments += 1
+                comment = generated_comments.get(comment_id, "[comment missing]")
+                comment = comment.replace("\n", "\\n")
+                # Replace the tag in the code with the comment appended.
+                input_str = input_str.replace(find_tag, f"{repl_tag} {comment}")
+        processed_str = re.sub(r"\s*<JANUS_PARTITION>\s*\n", "\n", input_str)
+        return processed_str.strip("\n"), missing_comments
+    def translate_janus_obj(self, obj: Any, name: str, failure_path: Path | None = None):
         comment_pattern = r"<(?:INLINE|BLOCK)_COMMENT \w{8}>.*$"
-        comments = list(
-            re.finditer(comment_pattern, block.original.text, flags=re.MULTILINE)
-        )
-        if not comments:
-            log.info(f"[{block.name}] Skipping commentless block")
-            block.translated = True
-            block.text = None
-            block.complete = True
-            return
-        if len(comments) <= self.eval_items_per_request:
-            return super()._add_translation(block)
-        comment_group_indices = list(range(0, len(comments), self.eval_items_per_request))
-        log.debug(
-            f"[{block.name}] Block contains more than {self.eval_items_per_request}"
-            f" comments, splitting {len(comments)} comments into"
-            f" {len(comment_group_indices)} groups"
-        )
-        block.processing_time = 0
-        block.cost = 0
-        block.retries = 0
-        obj = {}
-        for i in range(0, len(comments), self.eval_items_per_request):
-            # Split the text into the section containing comments of interest,
-            #  all the text prior to those comments, and all the text after them
-            working_comments = comments[i : i + self.eval_items_per_request]
-            start_idx = working_comments[0].start()
-            end_idx = working_comments[-1].end()
-            prefix = block.original.text[:start_idx]
-            keeper = block.original.text[start_idx:end_idx]
-            suffix = block.original.text[end_idx:]
-            # Strip all comment placeholders outside of the section of interest
-            prefix = re.sub(comment_pattern, "", prefix, flags=re.MULTILINE)
-            suffix = re.sub(comment_pattern, "", suffix, flags=re.MULTILINE)
-            # Build a new TranslatedBlock using the new working text
-            working_copy = deepcopy(block.original)
-            working_copy.text = prefix + keeper + suffix
-            working_block = TranslatedCodeBlock(working_copy, self._target_language)
-            # Run the LLM on the working text
-            super()._add_translation(working_block)
-            # Update metadata to include for all runs
-            block.retries += working_block.retries
-            block.cost += working_block.cost
-            block.processing_time += working_block.processing_time
-            # Update the output text to merge this section's output in
-            obj.update(json.loads(working_block.text))
-        block.text = json.dumps(obj)
-        block.tokens = self._llm.get_num_tokens(block.text)
-        block.translated = True
-        log.debug(
-            f"[{block.name}] Output code:\n{json.dumps(json.loads(block.text), indent=2)}"
-        )
+        results = []
+        input_str = obj["input"]
+        for o in obj["outputs"]:
+            if isinstance(o, dict):
+                results += self.translate_janus_obj(o, name, failure_path)
+            elif isinstance(o, str):
+                temp_obj = deepcopy(obj)
+                generated_comments = json.loads(o)
+                processed_input, missing_comments = self._process_comments(
+                    input_str, generated_comments
+                )
+                if missing_comments:
+                    log.info(f"[{name}] Warning: missing {missing_comments} comments")
+                comments = list(
+                    re.finditer(comment_pattern, processed_input, flags=re.MULTILINE)
+                )
+                if not comments:
+                    log.info(f"[{name}] Skipping commentless block")
+                    continue
+                if (
+                    self.eval_items_per_request is None
+                    or len(comments) < self.eval_items_per_request
+                ):
+                    temp_obj["outputs"] = [processed_input]
+                    temp_block = self._janus_object_to_codeblock(temp_obj, name)
+                    translated_block = self.translate_block(temp_block, failure_path)
+                    translated_block.previous_generations[-1] = obj
+                    translated_block.original = self._janus_object_to_codeblock(obj, name)
+                    results.append(translated_block)
+                    continue
+                comment_group_indices = list(
+                    range(0, len(comments), self.eval_items_per_request)
+                )
+                log.debug(
+                    f"[{name}] Block contains more than {self.eval_items_per_request}"
+                    f" comments, splitting {len(comments)} comments into"
+                    f" {len(comment_group_indices)} groups"
+                )
+                for comment_ind in comment_group_indices:
+                    working_comments = comments[
+                        comment_ind : comment_ind + self.eval_items_per_request
+                    ]
+                    start_idx = working_comments[0].start()
+                    end_idx = working_comments[-1].end()
+                    prefix = processed_input[:start_idx]
+                    keeper = processed_input[start_idx:end_idx]
+                    suffix = processed_input[end_idx:]
+                    # Strip all comment placeholders outside of the section of interest
+                    prefix = re.sub(comment_pattern, "", prefix, flags=re.MULTILINE)
+                    suffix = re.sub(comment_pattern, "", suffix, flags=re.MULTILINE)
+                    temp_obj["outputs"] = [prefix + keeper + suffix]
+                    temp_block = self._janus_object_to_codeblock(temp_obj, name)
+                    translated_block = self.translate_block(temp_block, failure_path)
+                    translated_block.previous_generations[-1] = obj
+                    translated_block.original = self._janus_object_to_codeblock(obj, name)
+                    results.append(translated_block)
+            else:
+                raise ValueError(f"Error: unrecognized janus object type: {type(o)}")
+        return results

janus/converter/partition.py CHANGED Viewed

@@ -1,7 +1,4 @@
-from pathlib import Path
 from janus.converter.converter import Converter
-from janus.language.block import TranslatedCodeBlock
 from janus.parsers.partition_parser import PartitionParser
 from janus.utils.logger import create_logger
@@ -11,17 +8,12 @@ log = create_logger(__name__)
 class Partitioner(Converter):
     def __init__(self, partition_token_limit: int, **kwargs):
         super().__init__(**kwargs)
-        self.set_prompt("partition")
+        self.set_prompts("partition")
         self._load_model()
         self._parser = PartitionParser(
             token_limit=partition_token_limit,
             model=self._llm,
         )
         self._target_language = self._source_language
-        self._target_suffix = self._source_suffix
+        self._target_suffix = self._source_suffixes[0]
         self._load_parameters()
-    def _save_to_file(self, block: TranslatedCodeBlock, out_path: Path) -> None:
-        output_str = self._parser.parse_combined_output(block.complete_text)
-        out_path.parent.mkdir(parents=True, exist_ok=True)
-        out_path.write_text(output_str, encoding="utf-8")

janus/converter/requirements.py CHANGED Viewed

@@ -1,8 +1,4 @@
-import json
-from pathlib import Path
 from janus.converter.document import Documenter
-from janus.language.block import TranslatedCodeBlock
 from janus.language.combine import ChunkCombiner
 from janus.parsers.reqs_parser import RequirementsParser
 from janus.utils.logger import create_logger
@@ -16,41 +12,9 @@ class RequirementsDocumenter(Documenter):
     A class that translates code from one programming language to its requirements.
     """
-    def __init__(self, **kwargs):
-        super().__init__(**kwargs)
-        self.set_prompt("requirements")
+    def __init__(self, combine_output: bool = False, **kwargs):
+        super().__init__(combine_output=combine_output, **kwargs)
+        self.set_prompts("requirements")
         self._combiner = ChunkCombiner()
         self._parser = RequirementsParser()
-    @staticmethod
-    def get_prompt_replacements(block) -> dict[str, str]:
-        prompt_replacements: dict[str, str] = {"SOURCE_CODE": block.original.text}
-        return prompt_replacements
-    def _save_to_file(self, block: TranslatedCodeBlock, out_path: Path) -> None:
-        """Save a file to disk.
-        Arguments:
-            block: The `CodeBlock` to save to a file.
-        """
-        output_list = list()
-        # For each chunk of code, get generation metadata, the text of the code,
-        # and the LLM generated requirements
-        blocks = [block for block in block.children] if len(block.children) else [block]
-        for block in blocks:
-            code = block.original.text
-            requirements = self._parser.parse_combined_output(block.complete_text)
-            metadata = dict(
-                retries=block.total_retries,
-                cost=block.total_cost,
-                processing_time=block.processing_time,
-            )
-            # Put them all in a top level 'output' key
-            output_list.append(
-                dict(metadata=metadata, code=code, requirements=requirements)
-            )
-        obj = dict(
-            output=output_list,
-        )
-        out_path.parent.mkdir(parents=True, exist_ok=True)
-        out_path.write_text(json.dumps(obj, indent=2), encoding="utf-8")
+        self._load_parameters()

janus/converter/translate.py CHANGED Viewed

@@ -1,8 +1,5 @@
 from janus.converter.converter import Converter, run_if_changed
-from janus.llm.models_info import MODEL_PROMPT_ENGINES
 from janus.parsers.code_parser import CodeParser
-from janus.prompts.prompt import SAME_OUTPUT
-from janus.utils.enums import LANGUAGES
 from janus.utils.logger import create_logger
 log = create_logger(__name__)
@@ -29,13 +26,11 @@ class Translator(Converter):
             max_prompts: The maximum number of prompts to try before giving up.
             max_tokens: The maximum number of tokens the model will take in.
                 If unspecificed, model's default max will be used.
-            prompt_template: name of prompt template directory
-                (see janus/prompts/templates) or path to a directory.
+            prompt_templates: name of prompt template directories
+                (see janus/prompts/templates) or paths to directories.
         """
         super().__init__(**kwargs)
-        self._target_version: str | None
         self.set_target_language(
             target_language=target_language,
             target_version=target_version,
@@ -47,57 +42,6 @@ class Translator(Converter):
         self._load_parser()
         super()._load_parameters()
-    def set_target_language(
-        self, target_language: str, target_version: str | None
-    ) -> None:
-        """Validate and set the target language.
-        The affected objects will not be updated until translate() is called.
-        Arguments:
-            target_language: The target programming language.
-            target_version: The target version of the target programming language.
-        """
-        target_language = target_language.lower()
-        if target_language not in LANGUAGES:
-            raise ValueError(
-                f"Invalid target language: {target_language}. "
-                "Valid target languages are found in `janus.utils.enums.LANGUAGES`."
-            )
-        self._target_language = target_language
-        self._target_version = target_version
-        # Taking the first suffix as the default for output files
-        self._target_suffix = f".{LANGUAGES[target_language]['suffixes'][0]}"
-    @run_if_changed(
-        "_prompt_template_name",
-        "_source_language",
-        "_target_language",
-        "_target_version",
-        "_model_name",
-    )
-    def _load_prompt(self) -> None:
-        """Load the prompt according to this instance's attributes.
-        If the relevant fields have not been changed since the last time this
-        method was called, nothing happens.
-        """
-        if self._prompt_template_name in SAME_OUTPUT:
-            if self._target_language != self._source_language:
-                raise ValueError(
-                    f"Prompt template ({self._prompt_template_name}) suggests "
-                    f"source and target languages should match, but do not "
-                    f"({self._source_language} != {self._target_language})"
-                )
-        prompt_engine = MODEL_PROMPT_ENGINES[self._llm.short_model_id](
-            source_language=self._source_language,
-            target_language=self._target_language,
-            target_version=self._target_version,
-            prompt_template=self._prompt_template_name,
-        )
-        self._prompt = prompt_engine.prompt
     @run_if_changed("_target_language")
     def _load_parser(self) -> None:
         """Load the parser according to this instance's attributes.

janus/language/block.py CHANGED Viewed

@@ -46,6 +46,7 @@ class CodeBlock:
         embedding_id: Optional[str] = None,
         affixes: Tuple[str, str] = ("", ""),
         context_tags: dict[str, str] = {},
+        previous_generations: list["TranslatedCodeBlock"] = [],
     ) -> None:
         self.id: Hashable = id
         self.name: Optional[str] = name
@@ -65,6 +66,7 @@ class CodeBlock:
         self.complete = True
         self.omit_prefix = True
         self.omit_suffix = False
+        self.previous_generations = previous_generations
         if self.children:
             self.children[0].omit_prefix = False
@@ -210,15 +212,16 @@ class TranslatedCodeBlock(CodeBlock):
                 TranslatedCodeBlock(child, language) for child in original.children
             ],
             affixes=original.affixes,
+            previous_generations=original.previous_generations,
         )
         self.original = original
         self.complete = original.complete
         self.translated = False
-        self.cost = 0.0
+        self.cost = 0
         self.num_requests = 0
         self.tokens = 0
-        self.processing_time = 0.0
+        self.processing_time = 0
         self.request_input_tokens = 0
         self.request_output_tokens = 0
@@ -297,3 +300,29 @@ class TranslatedCodeBlock(CodeBlock):
             if self.original.total_tokens
             else 0
         )
+    def to_codeblock(self) -> CodeBlock:
+        return CodeBlock(
+            id=self.id,
+            name=self.name,
+            node_type=self.node_type,
+            language=self.language,
+            text=self.text,
+            start_point=self.start_point,
+            end_point=self.end_point,
+            start_byte=self.start_byte,
+            end_byte=self.end_byte,
+            embedding_id=self.embedding_id,
+            tokens=self.tokens,
+            children=[child.to_codeblock() for child in self.children],
+            affixes=self.affixes,
+            previous_generations=self.previous_generations + [self],
+        )
+    def __iadd__(self, other):
+        self.cost += other.cost
+        self.num_requests += other.num_requests
+        self.processing_time += other.processing_time
+        self.request_input_tokens += other.request_input_tokens
+        self.request_output_tokens += other.request_output_tokens
+        return self

janus-llm 4.3.5__py3-none-any.whl → 4.4.5__py3-none-any.whl

janus-llm 4.3.5py3-none-any.whl → 4.4.5py3-none-any.whl