janus-llm 4.3.1__py3-none-any.whl → 4.3.5__py3-none-any.whl

Sign up to get free protection for your applications and to get access to all the features.
Files changed (128) hide show
  1. janus/__init__.py +1 -1
  2. janus/__main__.py +1 -1
  3. janus/_tests/evaluator_tests/EvalReadMe.md +85 -0
  4. janus/_tests/evaluator_tests/incose_tests/incose_large_test.json +39 -0
  5. janus/_tests/evaluator_tests/incose_tests/incose_small_test.json +17 -0
  6. janus/_tests/evaluator_tests/inline_comment_tests/mumps_inline_comment_test.m +71 -0
  7. janus/_tests/test_cli.py +3 -2
  8. janus/cli/aggregate.py +135 -0
  9. janus/cli/cli.py +111 -0
  10. janus/cli/constants.py +43 -0
  11. janus/cli/database.py +289 -0
  12. janus/cli/diagram.py +178 -0
  13. janus/cli/document.py +174 -0
  14. janus/cli/embedding.py +122 -0
  15. janus/cli/llm.py +187 -0
  16. janus/cli/partition.py +125 -0
  17. janus/cli/self_eval.py +149 -0
  18. janus/cli/translate.py +183 -0
  19. janus/converter/__init__.py +1 -1
  20. janus/converter/_tests/test_translate.py +2 -0
  21. janus/converter/converter.py +129 -93
  22. janus/converter/document.py +21 -14
  23. janus/converter/evaluate.py +20 -13
  24. janus/converter/translate.py +3 -3
  25. janus/embedding/collections.py +1 -1
  26. janus/language/alc/_tests/alc.asm +3779 -0
  27. janus/language/binary/_tests/hello.bin +0 -0
  28. janus/language/block.py +47 -12
  29. janus/language/file.py +1 -1
  30. janus/language/mumps/_tests/mumps.m +235 -0
  31. janus/language/treesitter/_tests/languages/fortran.f90 +416 -0
  32. janus/language/treesitter/_tests/languages/ibmhlasm.asm +16 -0
  33. janus/language/treesitter/_tests/languages/matlab.m +225 -0
  34. janus/llm/models_info.py +9 -1
  35. janus/metrics/_tests/asm_test_file.asm +10 -0
  36. janus/metrics/_tests/mumps_test_file.m +6 -0
  37. janus/metrics/_tests/test_treesitter_metrics.py +1 -1
  38. janus/metrics/prompts/clarity.txt +8 -0
  39. janus/metrics/prompts/completeness.txt +16 -0
  40. janus/metrics/prompts/faithfulness.txt +10 -0
  41. janus/metrics/prompts/hallucination.txt +16 -0
  42. janus/metrics/prompts/quality.txt +8 -0
  43. janus/metrics/prompts/readability.txt +16 -0
  44. janus/metrics/prompts/usefulness.txt +16 -0
  45. janus/parsers/code_parser.py +4 -4
  46. janus/parsers/doc_parser.py +12 -9
  47. janus/parsers/parser.py +7 -0
  48. janus/parsers/partition_parser.py +6 -4
  49. janus/parsers/reqs_parser.py +8 -5
  50. janus/parsers/uml.py +5 -4
  51. janus/prompts/prompt.py +2 -2
  52. janus/prompts/templates/README.md +30 -0
  53. janus/prompts/templates/basic_aggregation/human.txt +6 -0
  54. janus/prompts/templates/basic_aggregation/system.txt +1 -0
  55. janus/prompts/templates/basic_refinement/human.txt +14 -0
  56. janus/prompts/templates/basic_refinement/system.txt +1 -0
  57. janus/prompts/templates/diagram/human.txt +9 -0
  58. janus/prompts/templates/diagram/system.txt +1 -0
  59. janus/prompts/templates/diagram_with_documentation/human.txt +15 -0
  60. janus/prompts/templates/diagram_with_documentation/system.txt +1 -0
  61. janus/prompts/templates/document/human.txt +10 -0
  62. janus/prompts/templates/document/system.txt +1 -0
  63. janus/prompts/templates/document_cloze/human.txt +11 -0
  64. janus/prompts/templates/document_cloze/system.txt +1 -0
  65. janus/prompts/templates/document_cloze/variables.json +4 -0
  66. janus/prompts/templates/document_cloze/variables_asm.json +4 -0
  67. janus/prompts/templates/document_inline/human.txt +13 -0
  68. janus/prompts/templates/eval_prompts/incose/human.txt +32 -0
  69. janus/prompts/templates/eval_prompts/incose/system.txt +1 -0
  70. janus/prompts/templates/eval_prompts/incose/variables.json +3 -0
  71. janus/prompts/templates/eval_prompts/inline_comments/human.txt +49 -0
  72. janus/prompts/templates/eval_prompts/inline_comments/system.txt +1 -0
  73. janus/prompts/templates/eval_prompts/inline_comments/variables.json +3 -0
  74. janus/prompts/templates/micromanaged_mumps_v1.0/human.txt +23 -0
  75. janus/prompts/templates/micromanaged_mumps_v1.0/system.txt +3 -0
  76. janus/prompts/templates/micromanaged_mumps_v2.0/human.txt +28 -0
  77. janus/prompts/templates/micromanaged_mumps_v2.0/system.txt +3 -0
  78. janus/prompts/templates/micromanaged_mumps_v2.1/human.txt +29 -0
  79. janus/prompts/templates/micromanaged_mumps_v2.1/system.txt +3 -0
  80. janus/prompts/templates/multidocument/human.txt +15 -0
  81. janus/prompts/templates/multidocument/system.txt +1 -0
  82. janus/prompts/templates/partition/human.txt +22 -0
  83. janus/prompts/templates/partition/system.txt +1 -0
  84. janus/prompts/templates/partition/variables.json +4 -0
  85. janus/prompts/templates/pseudocode/human.txt +7 -0
  86. janus/prompts/templates/pseudocode/system.txt +7 -0
  87. janus/prompts/templates/refinement/fix_exceptions/human.txt +19 -0
  88. janus/prompts/templates/refinement/fix_exceptions/system.txt +1 -0
  89. janus/prompts/templates/refinement/format/code_format/human.txt +12 -0
  90. janus/prompts/templates/refinement/format/code_format/system.txt +1 -0
  91. janus/prompts/templates/refinement/format/requirements_format/human.txt +14 -0
  92. janus/prompts/templates/refinement/format/requirements_format/system.txt +1 -0
  93. janus/prompts/templates/refinement/hallucination/human.txt +13 -0
  94. janus/prompts/templates/refinement/hallucination/system.txt +1 -0
  95. janus/prompts/templates/refinement/reflection/human.txt +15 -0
  96. janus/prompts/templates/refinement/reflection/incose/human.txt +26 -0
  97. janus/prompts/templates/refinement/reflection/incose/system.txt +1 -0
  98. janus/prompts/templates/refinement/reflection/incose_deduplicate/human.txt +16 -0
  99. janus/prompts/templates/refinement/reflection/incose_deduplicate/system.txt +1 -0
  100. janus/prompts/templates/refinement/reflection/system.txt +1 -0
  101. janus/prompts/templates/refinement/revision/human.txt +16 -0
  102. janus/prompts/templates/refinement/revision/incose/human.txt +16 -0
  103. janus/prompts/templates/refinement/revision/incose/system.txt +1 -0
  104. janus/prompts/templates/refinement/revision/incose_deduplicate/human.txt +17 -0
  105. janus/prompts/templates/refinement/revision/incose_deduplicate/system.txt +1 -0
  106. janus/prompts/templates/refinement/revision/system.txt +1 -0
  107. janus/prompts/templates/refinement/uml/alc_fix_variables/human.txt +15 -0
  108. janus/prompts/templates/refinement/uml/alc_fix_variables/system.txt +2 -0
  109. janus/prompts/templates/refinement/uml/fix_connections/human.txt +15 -0
  110. janus/prompts/templates/refinement/uml/fix_connections/system.txt +2 -0
  111. janus/prompts/templates/requirements/human.txt +13 -0
  112. janus/prompts/templates/requirements/system.txt +2 -0
  113. janus/prompts/templates/retrieval/language_docs/human.txt +10 -0
  114. janus/prompts/templates/retrieval/language_docs/system.txt +1 -0
  115. janus/prompts/templates/simple/human.txt +16 -0
  116. janus/prompts/templates/simple/system.txt +3 -0
  117. janus/refiners/format.py +49 -0
  118. janus/refiners/refiner.py +113 -4
  119. janus/utils/enums.py +127 -112
  120. janus/utils/logger.py +2 -0
  121. {janus_llm-4.3.1.dist-info → janus_llm-4.3.5.dist-info}/METADATA +7 -7
  122. janus_llm-4.3.5.dist-info/RECORD +210 -0
  123. {janus_llm-4.3.1.dist-info → janus_llm-4.3.5.dist-info}/WHEEL +1 -1
  124. janus_llm-4.3.5.dist-info/entry_points.txt +3 -0
  125. janus/cli.py +0 -1488
  126. janus_llm-4.3.1.dist-info/RECORD +0 -115
  127. janus_llm-4.3.1.dist-info/entry_points.txt +0 -3
  128. {janus_llm-4.3.1.dist-info → janus_llm-4.3.5.dist-info}/LICENSE +0 -0
janus/cli.py DELETED
@@ -1,1488 +0,0 @@
1
- import json
2
- import logging
3
- import os
4
- import subprocess # nosec
5
- from pathlib import Path
6
- from typing import List, Optional
7
-
8
- import click
9
- import typer
10
- from pydantic import AnyHttpUrl
11
- from rich import print
12
- from rich.console import Console
13
- from rich.prompt import Confirm
14
- from typing_extensions import Annotated
15
-
16
- import janus.refiners.refiner
17
- import janus.refiners.uml
18
- from janus.converter.aggregator import Aggregator
19
- from janus.converter.converter import Converter
20
- from janus.converter.diagram import DiagramGenerator
21
- from janus.converter.document import Documenter, MadLibsDocumenter, MultiDocumenter
22
- from janus.converter.evaluate import InlineCommentEvaluator, RequirementEvaluator
23
- from janus.converter.partition import Partitioner
24
- from janus.converter.requirements import RequirementsDocumenter
25
- from janus.converter.translate import Translator
26
- from janus.embedding.collections import Collections
27
- from janus.embedding.database import ChromaEmbeddingDatabase
28
- from janus.embedding.embedding_models_info import (
29
- EMBEDDING_COST_PER_MODEL,
30
- EMBEDDING_MODEL_CONFIG_DIR,
31
- EMBEDDING_TOKEN_LIMITS,
32
- EmbeddingModelType,
33
- )
34
- from janus.embedding.vectorize import ChromaDBVectorizer
35
- from janus.language.binary import BinarySplitter
36
- from janus.language.mumps import MumpsSplitter
37
- from janus.language.naive.registry import CUSTOM_SPLITTERS
38
- from janus.language.treesitter import TreeSitterSplitter
39
- from janus.llm.model_callbacks import COST_PER_1K_TOKENS
40
- from janus.llm.models_info import (
41
- MODEL_CONFIG_DIR,
42
- MODEL_ID_TO_LONG_ID,
43
- MODEL_TYPE_CONSTRUCTORS,
44
- MODEL_TYPES,
45
- TOKEN_LIMITS,
46
- azure_models,
47
- bedrock_models,
48
- openai_models,
49
- )
50
- from janus.metrics.cli import evaluate
51
- from janus.utils.enums import LANGUAGES
52
- from janus.utils.logger import create_logger
53
-
54
- httpx_logger = logging.getLogger("httpx")
55
- httpx_logger.setLevel(logging.WARNING)
56
-
57
- log = create_logger(__name__)
58
- homedir = Path.home().expanduser()
59
-
60
- janus_dir = homedir / ".janus"
61
- if not janus_dir.exists():
62
- janus_dir.mkdir(parents=True)
63
-
64
- db_file = janus_dir / ".db"
65
- if not db_file.exists():
66
- with open(db_file, "w") as f:
67
- f.write(str(janus_dir / "chroma.db"))
68
-
69
- with open(db_file, "r") as f:
70
- db_loc = f.read()
71
-
72
- collections_config_file = Path(db_loc) / "collections.json"
73
-
74
-
75
- def get_subclasses(cls):
76
- return set(cls.__subclasses__()).union(
77
- set(s for c in cls.__subclasses__() for s in get_subclasses(c))
78
- )
79
-
80
-
81
- REFINER_TYPES = get_subclasses(janus.refiners.refiner.JanusRefiner).union(
82
- {janus.refiners.refiner.JanusRefiner}
83
- )
84
- REFINERS = {r.__name__: r for r in REFINER_TYPES}
85
-
86
-
87
- def get_collections_config():
88
- if collections_config_file.exists():
89
- with open(collections_config_file, "r") as f:
90
- config = json.load(f)
91
- else:
92
- config = {}
93
- return config
94
-
95
-
96
- app = typer.Typer(
97
- help=(
98
- "[bold][dark_orange]Janus[/dark_orange] is a CLI for translating, "
99
- "documenting, and diagramming code using large language models.[/bold]"
100
- ),
101
- add_completion=False,
102
- no_args_is_help=True,
103
- context_settings={"help_option_names": ["-h", "--help"]},
104
- rich_markup_mode="rich",
105
- )
106
-
107
-
108
- db = typer.Typer(
109
- help="Database commands",
110
- add_completion=False,
111
- no_args_is_help=True,
112
- context_settings={"help_option_names": ["-h", "--help"]},
113
- )
114
- llm = typer.Typer(
115
- help="LLM commands",
116
- add_completion=False,
117
- no_args_is_help=True,
118
- context_settings={"help_option_names": ["-h", "--help"]},
119
- )
120
-
121
- embedding = typer.Typer(
122
- help="Embedding model commands",
123
- add_completion=False,
124
- no_args_is_help=True,
125
- context_settings={"help_option_names": ["-h", "--help"]},
126
- )
127
-
128
-
129
- def version_callback(value: bool) -> None:
130
- if value:
131
- from . import __version__ as version
132
-
133
- print(f"Janus CLI [blue]v{version}[/blue]")
134
- raise typer.Exit()
135
-
136
-
137
- @app.callback()
138
- def common(
139
- ctx: typer.Context,
140
- version: bool = typer.Option(
141
- None,
142
- "--version",
143
- "-v",
144
- callback=version_callback,
145
- help="Print the version and exit.",
146
- ),
147
- ) -> None:
148
- """A function for getting the app version
149
-
150
- This will call the version_callback function to print the version and exit.
151
-
152
- Arguments:
153
- ctx: The typer context
154
- version: A boolean flag for the version
155
- """
156
- pass
157
-
158
-
159
- @app.command(
160
- help="Translate code from one language to another using an LLM.",
161
- no_args_is_help=True,
162
- )
163
- def translate(
164
- input_dir: Annotated[
165
- Path,
166
- typer.Option(
167
- "--input",
168
- "-i",
169
- help="The directory containing the source code to be translated. "
170
- "The files should all be in one flat directory.",
171
- ),
172
- ],
173
- source_lang: Annotated[
174
- str,
175
- typer.Option(
176
- "--source-language",
177
- "-s",
178
- help="The language of the source code.",
179
- click_type=click.Choice(sorted(LANGUAGES)),
180
- ),
181
- ],
182
- output_dir: Annotated[
183
- Path,
184
- typer.Option(
185
- "--output", "-o", help="The directory to store the translated code in."
186
- ),
187
- ],
188
- target_lang: Annotated[
189
- str,
190
- typer.Option(
191
- "--target-language",
192
- "-t",
193
- help="The desired output language to translate the source code to. The "
194
- "format can follow a 'language-version' syntax. Use 'text' to get plaintext"
195
- "results as returned by the LLM. Examples: `python-3.10`, `mumps`, `java-10`,"
196
- "text.",
197
- ),
198
- ],
199
- llm_name: Annotated[
200
- str,
201
- typer.Option(
202
- "--llm",
203
- "-L",
204
- help="The custom name of the model set with 'janus llm add'.",
205
- ),
206
- ],
207
- max_prompts: Annotated[
208
- int,
209
- typer.Option(
210
- "--max-prompts",
211
- "-m",
212
- help="The maximum number of times to prompt a model on one functional block "
213
- "before exiting the application. This is to prevent wasting too much money.",
214
- ),
215
- ] = 10,
216
- overwrite: Annotated[
217
- bool,
218
- typer.Option(
219
- "--overwrite/--preserve",
220
- help="Whether to overwrite existing files in the output directory",
221
- ),
222
- ] = False,
223
- skip_context: Annotated[
224
- bool,
225
- typer.Option(
226
- "--skip-context",
227
- help="Prompts will include any context information associated with source"
228
- " code blocks, unless this option is specified",
229
- ),
230
- ] = False,
231
- temp: Annotated[
232
- float,
233
- typer.Option("--temperature", "-T", help="Sampling temperature.", min=0, max=2),
234
- ] = 0.7,
235
- prompt_template: Annotated[
236
- str,
237
- typer.Option(
238
- "--prompt-template",
239
- "-p",
240
- help="Name of the Janus prompt template directory or "
241
- "path to a directory containing those template files.",
242
- ),
243
- ] = "simple",
244
- collection: Annotated[
245
- str,
246
- typer.Option(
247
- "--collection",
248
- "-c",
249
- help="If set, will put the translated result into a Chroma DB "
250
- "collection with the name provided.",
251
- ),
252
- ] = None,
253
- splitter_type: Annotated[
254
- str,
255
- typer.Option(
256
- "-S",
257
- "--splitter",
258
- help="Name of custom splitter to use",
259
- click_type=click.Choice(list(CUSTOM_SPLITTERS.keys())),
260
- ),
261
- ] = "file",
262
- refiner_types: Annotated[
263
- list[str],
264
- typer.Option(
265
- "-r",
266
- "--refiner",
267
- help="List of refiner types to use. Add -r for each refiner to use in\
268
- refinement chain",
269
- click_type=click.Choice(list(REFINERS.keys())),
270
- ),
271
- ] = ["JanusRefiner"],
272
- retriever_type: Annotated[
273
- str,
274
- typer.Option(
275
- "-R",
276
- "--retriever",
277
- help="Name of custom retriever to use",
278
- click_type=click.Choice(["active_usings", "language_docs"]),
279
- ),
280
- ] = None,
281
- max_tokens: Annotated[
282
- int,
283
- typer.Option(
284
- "--max-tokens",
285
- "-M",
286
- help="The maximum number of tokens the model will take in. "
287
- "If unspecificed, model's default max will be used.",
288
- ),
289
- ] = None,
290
- ):
291
- refiner_types = [REFINERS[r] for r in refiner_types]
292
- try:
293
- target_language, target_version = target_lang.split("-")
294
- except ValueError:
295
- target_language = target_lang
296
- target_version = None
297
- # make sure not overwriting input
298
- if source_lang.lower() == target_language.lower() and input_dir == output_dir:
299
- log.error("Output files would overwrite input! Aborting...")
300
- raise ValueError
301
-
302
- model_arguments = dict(temperature=temp)
303
- collections_config = get_collections_config()
304
- translator = Translator(
305
- model=llm_name,
306
- model_arguments=model_arguments,
307
- source_language=source_lang,
308
- target_language=target_language,
309
- target_version=target_version,
310
- max_prompts=max_prompts,
311
- max_tokens=max_tokens,
312
- prompt_template=prompt_template,
313
- db_path=db_loc,
314
- db_config=collections_config,
315
- splitter_type=splitter_type,
316
- refiner_types=refiner_types,
317
- retriever_type=retriever_type,
318
- )
319
- translator.translate(input_dir, output_dir, overwrite, collection)
320
-
321
-
322
- @app.command(
323
- help="Document input code using an LLM.",
324
- no_args_is_help=True,
325
- )
326
- def document(
327
- input_dir: Annotated[
328
- Path,
329
- typer.Option(
330
- "--input",
331
- "-i",
332
- help="The directory containing the source code to be translated. "
333
- "The files should all be in one flat directory.",
334
- ),
335
- ],
336
- language: Annotated[
337
- str,
338
- typer.Option(
339
- "--language",
340
- "-l",
341
- help="The language of the source code.",
342
- click_type=click.Choice(sorted(LANGUAGES)),
343
- ),
344
- ],
345
- output_dir: Annotated[
346
- Path,
347
- typer.Option(
348
- "--output-dir", "-o", help="The directory to store the translated code in."
349
- ),
350
- ],
351
- llm_name: Annotated[
352
- str,
353
- typer.Option(
354
- "--llm",
355
- "-L",
356
- help="The custom name of the model set with 'janus llm add'.",
357
- ),
358
- ],
359
- max_prompts: Annotated[
360
- int,
361
- typer.Option(
362
- "--max-prompts",
363
- "-m",
364
- help="The maximum number of times to prompt a model on one functional block "
365
- "before exiting the application. This is to prevent wasting too much money.",
366
- ),
367
- ] = 10,
368
- overwrite: Annotated[
369
- bool,
370
- typer.Option(
371
- "--overwrite/--preserve",
372
- help="Whether to overwrite existing files in the output directory",
373
- ),
374
- ] = False,
375
- doc_mode: Annotated[
376
- str,
377
- typer.Option(
378
- "--doc-mode",
379
- "-d",
380
- help="The documentation mode.",
381
- click_type=click.Choice(["madlibs", "summary", "multidoc", "requirements"]),
382
- ),
383
- ] = "madlibs",
384
- comments_per_request: Annotated[
385
- int,
386
- typer.Option(
387
- "--comments-per-request",
388
- "-rc",
389
- help="The maximum number of comments to generate per request when using "
390
- "MadLibs documentation mode.",
391
- ),
392
- ] = None,
393
- drop_comments: Annotated[
394
- bool,
395
- typer.Option(
396
- "--drop-comments/--keep-comments",
397
- help="Whether to drop or keep comments in the code sent to the LLM",
398
- ),
399
- ] = False,
400
- temperature: Annotated[
401
- float,
402
- typer.Option("--temperature", "-t", help="Sampling temperature.", min=0, max=2),
403
- ] = 0.7,
404
- collection: Annotated[
405
- str,
406
- typer.Option(
407
- "--collection",
408
- "-c",
409
- help="If set, will put the translated result into a Chroma DB "
410
- "collection with the name provided.",
411
- ),
412
- ] = None,
413
- splitter_type: Annotated[
414
- str,
415
- typer.Option(
416
- "-S",
417
- "--splitter",
418
- help="Name of custom splitter to use",
419
- click_type=click.Choice(list(CUSTOM_SPLITTERS.keys())),
420
- ),
421
- ] = "file",
422
- refiner_types: Annotated[
423
- list[str],
424
- typer.Option(
425
- "-r",
426
- "--refiner",
427
- help="List of refiner types to use. Add -r for each refiner to use in\
428
- refinement chain",
429
- click_type=click.Choice(list(REFINERS.keys())),
430
- ),
431
- ] = ["JanusRefiner"],
432
- retriever_type: Annotated[
433
- str,
434
- typer.Option(
435
- "-R",
436
- "--retriever",
437
- help="Name of custom retriever to use",
438
- click_type=click.Choice(["active_usings", "language_docs"]),
439
- ),
440
- ] = None,
441
- max_tokens: Annotated[
442
- int,
443
- typer.Option(
444
- "--max-tokens",
445
- "-M",
446
- help="The maximum number of tokens the model will take in. "
447
- "If unspecificed, model's default max will be used.",
448
- ),
449
- ] = None,
450
- ):
451
- refiner_types = [REFINERS[r] for r in refiner_types]
452
- model_arguments = dict(temperature=temperature)
453
- collections_config = get_collections_config()
454
- kwargs = dict(
455
- model=llm_name,
456
- model_arguments=model_arguments,
457
- source_language=language,
458
- max_prompts=max_prompts,
459
- max_tokens=max_tokens,
460
- db_path=db_loc,
461
- db_config=collections_config,
462
- splitter_type=splitter_type,
463
- refiner_types=refiner_types,
464
- retriever_type=retriever_type,
465
- )
466
- if doc_mode == "madlibs":
467
- documenter = MadLibsDocumenter(
468
- comments_per_request=comments_per_request, **kwargs
469
- )
470
- elif doc_mode == "multidoc":
471
- documenter = MultiDocumenter(drop_comments=drop_comments, **kwargs)
472
- elif doc_mode == "requirements":
473
- documenter = RequirementsDocumenter(drop_comments=drop_comments, **kwargs)
474
- else:
475
- documenter = Documenter(drop_comments=drop_comments, **kwargs)
476
-
477
- documenter.translate(input_dir, output_dir, overwrite, collection)
478
-
479
-
480
- @app.command()
481
- def aggregate(
482
- input_dir: Annotated[
483
- Path,
484
- typer.Option(
485
- "--input",
486
- "-i",
487
- help="The directory containing the source code to be translated. "
488
- "The files should all be in one flat directory.",
489
- ),
490
- ],
491
- language: Annotated[
492
- str,
493
- typer.Option(
494
- "--language",
495
- "-l",
496
- help="The language of the source code.",
497
- click_type=click.Choice(sorted(LANGUAGES)),
498
- ),
499
- ],
500
- output_dir: Annotated[
501
- Path,
502
- typer.Option(
503
- "--output-dir", "-o", help="The directory to store the translated code in."
504
- ),
505
- ],
506
- llm_name: Annotated[
507
- str,
508
- typer.Option(
509
- "--llm",
510
- "-L",
511
- help="The custom name of the model set with 'janus llm add'.",
512
- ),
513
- ],
514
- max_prompts: Annotated[
515
- int,
516
- typer.Option(
517
- "--max-prompts",
518
- "-m",
519
- help="The maximum number of times to prompt a model on one functional block "
520
- "before exiting the application. This is to prevent wasting too much money.",
521
- ),
522
- ] = 10,
523
- overwrite: Annotated[
524
- bool,
525
- typer.Option(
526
- "--overwrite/--preserve",
527
- help="Whether to overwrite existing files in the output directory",
528
- ),
529
- ] = False,
530
- temperature: Annotated[
531
- float,
532
- typer.Option("--temperature", "-t", help="Sampling temperature.", min=0, max=2),
533
- ] = 0.7,
534
- collection: Annotated[
535
- str,
536
- typer.Option(
537
- "--collection",
538
- "-c",
539
- help="If set, will put the translated result into a Chroma DB "
540
- "collection with the name provided.",
541
- ),
542
- ] = None,
543
- splitter_type: Annotated[
544
- str,
545
- typer.Option(
546
- "-S",
547
- "--splitter",
548
- help="Name of custom splitter to use",
549
- click_type=click.Choice(list(CUSTOM_SPLITTERS.keys())),
550
- ),
551
- ] = "file",
552
- intermediate_converters: Annotated[
553
- List[str],
554
- typer.Option(
555
- "-C",
556
- "--converter",
557
- help="Name of an intermediate converter to use",
558
- click_type=click.Choice([c.__name__ for c in get_subclasses(Converter)]),
559
- ),
560
- ] = ["Documenter"],
561
- ):
562
- converter_subclasses = get_subclasses(Converter)
563
- converter_subclasses_map = {c.__name__: c for c in converter_subclasses}
564
- model_arguments = dict(temperature=temperature)
565
- collections_config = get_collections_config()
566
- converters = []
567
- for ic in intermediate_converters:
568
- converters.append(
569
- converter_subclasses_map[ic](
570
- model=llm_name,
571
- model_arguments=model_arguments,
572
- source_language=language,
573
- max_prompts=max_prompts,
574
- db_path=db_loc,
575
- db_config=collections_config,
576
- splitter_type=splitter_type,
577
- )
578
- )
579
-
580
- aggregator = Aggregator(
581
- intermediate_converters=converters,
582
- model=llm_name,
583
- model_arguments=model_arguments,
584
- source_language=language,
585
- max_prompts=max_prompts,
586
- db_path=db_loc,
587
- db_config=collections_config,
588
- splitter_type=splitter_type,
589
- prompt_template="basic_aggregation",
590
- )
591
- aggregator.translate(input_dir, output_dir, overwrite, collection)
592
-
593
-
594
- @app.command(
595
- help="Partition input code using an LLM.",
596
- no_args_is_help=True,
597
- )
598
- def partition(
599
- input_dir: Annotated[
600
- Path,
601
- typer.Option(
602
- "--input",
603
- "-i",
604
- help="The directory containing the source code to be partitioned. ",
605
- ),
606
- ],
607
- language: Annotated[
608
- str,
609
- typer.Option(
610
- "--language",
611
- "-l",
612
- help="The language of the source code.",
613
- click_type=click.Choice(sorted(LANGUAGES)),
614
- ),
615
- ],
616
- output_dir: Annotated[
617
- Path,
618
- typer.Option(
619
- "--output-dir", "-o", help="The directory to store the partitioned code in."
620
- ),
621
- ],
622
- llm_name: Annotated[
623
- str,
624
- typer.Option(
625
- "--llm",
626
- "-L",
627
- help="The custom name of the model set with 'janus llm add'.",
628
- ),
629
- ] = "gpt-4o",
630
- max_prompts: Annotated[
631
- int,
632
- typer.Option(
633
- "--max-prompts",
634
- "-m",
635
- help="The maximum number of times to prompt a model on one functional block "
636
- "before exiting the application. This is to prevent wasting too much money.",
637
- ),
638
- ] = 10,
639
- overwrite: Annotated[
640
- bool,
641
- typer.Option(
642
- "--overwrite/--preserve",
643
- help="Whether to overwrite existing files in the output directory",
644
- ),
645
- ] = False,
646
- temperature: Annotated[
647
- float,
648
- typer.Option("--temperature", "-t", help="Sampling temperature.", min=0, max=2),
649
- ] = 0.7,
650
- splitter_type: Annotated[
651
- str,
652
- typer.Option(
653
- "-S",
654
- "--splitter",
655
- help="Name of custom splitter to use",
656
- click_type=click.Choice(list(CUSTOM_SPLITTERS.keys())),
657
- ),
658
- ] = "file",
659
- refiner_types: Annotated[
660
- list[str],
661
- typer.Option(
662
- "-r",
663
- "--refiner",
664
- help="List of refiner types to use. Add -r for each refiner to use in\
665
- refinement chain",
666
- click_type=click.Choice(list(REFINERS.keys())),
667
- ),
668
- ] = ["JanusRefiner"],
669
- max_tokens: Annotated[
670
- int,
671
- typer.Option(
672
- "--max-tokens",
673
- "-M",
674
- help="The maximum number of tokens the model will take in. "
675
- "If unspecificed, model's default max will be used.",
676
- ),
677
- ] = None,
678
- partition_token_limit: Annotated[
679
- int,
680
- typer.Option(
681
- "--partition-tokens",
682
- "-pt",
683
- help="The limit on the number of tokens per partition.",
684
- ),
685
- ] = 8192,
686
- ):
687
- refiner_types = [REFINERS[r] for r in refiner_types]
688
- model_arguments = dict(temperature=temperature)
689
- kwargs = dict(
690
- model=llm_name,
691
- model_arguments=model_arguments,
692
- source_language=language,
693
- max_prompts=max_prompts,
694
- max_tokens=max_tokens,
695
- splitter_type=splitter_type,
696
- refiner_types=refiner_types,
697
- partition_token_limit=partition_token_limit,
698
- )
699
- partitioner = Partitioner(**kwargs)
700
- partitioner.translate(input_dir, output_dir, overwrite)
701
-
702
-
703
- @app.command(
704
- help="Diagram input code using an LLM.",
705
- no_args_is_help=True,
706
- )
707
- def diagram(
708
- input_dir: Annotated[
709
- Path,
710
- typer.Option(
711
- "--input",
712
- "-i",
713
- help="The directory containing the source code to be translated. "
714
- "The files should all be in one flat directory.",
715
- ),
716
- ],
717
- language: Annotated[
718
- str,
719
- typer.Option(
720
- "--language",
721
- "-l",
722
- help="The language of the source code.",
723
- click_type=click.Choice(sorted(LANGUAGES)),
724
- ),
725
- ],
726
- output_dir: Annotated[
727
- Path,
728
- typer.Option(
729
- "--output-dir", "-o", help="The directory to store the translated code in."
730
- ),
731
- ],
732
- llm_name: Annotated[
733
- str,
734
- typer.Option(
735
- "--llm",
736
- "-L",
737
- help="The custom name of the model set with 'janus llm add'.",
738
- ),
739
- ],
740
- max_prompts: Annotated[
741
- int,
742
- typer.Option(
743
- "--max-prompts",
744
- "-m",
745
- help="The maximum number of times to prompt a model on one functional block "
746
- "before exiting the application. This is to prevent wasting too much money.",
747
- ),
748
- ] = 10,
749
- overwrite: Annotated[
750
- bool,
751
- typer.Option(
752
- "--overwrite/--preserve",
753
- help="Whether to overwrite existing files in the output directory",
754
- ),
755
- ] = False,
756
- temperature: Annotated[
757
- float,
758
- typer.Option("--temperature", "-t", help="Sampling temperature.", min=0, max=2),
759
- ] = 0.7,
760
- collection: Annotated[
761
- str,
762
- typer.Option(
763
- "--collection",
764
- "-c",
765
- help="If set, will put the translated result into a Chroma DB "
766
- "collection with the name provided.",
767
- ),
768
- ] = None,
769
- diagram_type: Annotated[
770
- str,
771
- typer.Option(
772
- "--diagram-type", "-dg", help="Diagram type to generate in PLANTUML"
773
- ),
774
- ] = "Activity",
775
- add_documentation: Annotated[
776
- bool,
777
- typer.Option(
778
- "--add-documentation/--no-documentation",
779
- "-ad",
780
- help="Whether to use documentation in generation",
781
- ),
782
- ] = False,
783
- splitter_type: Annotated[
784
- str,
785
- typer.Option(
786
- "-S",
787
- "--splitter",
788
- help="Name of custom splitter to use",
789
- click_type=click.Choice(list(CUSTOM_SPLITTERS.keys())),
790
- ),
791
- ] = "file",
792
- refiner_types: Annotated[
793
- list[str],
794
- typer.Option(
795
- "-r",
796
- "--refiner",
797
- help="List of refiner types to use. Add -r for each refiner to use in\
798
- refinement chain",
799
- click_type=click.Choice(list(REFINERS.keys())),
800
- ),
801
- ] = ["JanusRefiner"],
802
- retriever_type: Annotated[
803
- str,
804
- typer.Option(
805
- "-R",
806
- "--retriever",
807
- help="Name of custom retriever to use",
808
- click_type=click.Choice(["active_usings", "language_docs"]),
809
- ),
810
- ] = None,
811
- ):
812
- refiner_types = [REFINERS[r] for r in refiner_types]
813
- model_arguments = dict(temperature=temperature)
814
- collections_config = get_collections_config()
815
- diagram_generator = DiagramGenerator(
816
- model=llm_name,
817
- model_arguments=model_arguments,
818
- source_language=language,
819
- max_prompts=max_prompts,
820
- db_path=db_loc,
821
- db_config=collections_config,
822
- splitter_type=splitter_type,
823
- refiner_types=refiner_types,
824
- retriever_type=retriever_type,
825
- diagram_type=diagram_type,
826
- add_documentation=add_documentation,
827
- )
828
- diagram_generator.translate(input_dir, output_dir, overwrite, collection)
829
-
830
-
831
@app.command(
    help="LLM self evaluation",
    no_args_is_help=True,
)
def llm_self_eval(
    input_dir: Annotated[
        Path,
        typer.Option(
            "--input",
            "-i",
            help="The directory containing the source code to be evaluated. "
            "The files should all be in one flat directory.",
        ),
    ],
    language: Annotated[
        str,
        typer.Option(
            "--language",
            "-l",
            help="The language of the source code.",
            click_type=click.Choice(sorted(LANGUAGES)),
        ),
    ],
    output_dir: Annotated[
        Path,
        typer.Option(
            "--output-dir", "-o", help="The directory to store the evaluations in."
        ),
    ],
    llm_name: Annotated[
        str,
        typer.Option(
            "--llm",
            "-L",
            help="The custom name of the model set with 'janus llm add'.",
        ),
    ] = "gpt-4o",
    evaluation_type: Annotated[
        str,
        typer.Option(
            "--evaluation-type",
            "-e",
            help="Type of output to evaluate.",
            click_type=click.Choice(["incose", "comments"]),
        ),
    ] = "incose",
    max_prompts: Annotated[
        int,
        typer.Option(
            "--max-prompts",
            "-m",
            help="The maximum number of times to prompt a model on one functional block "
            "before exiting the application. This is to prevent wasting too much money.",
        ),
    ] = 10,
    overwrite: Annotated[
        bool,
        typer.Option(
            "--overwrite/--preserve",
            help="Whether to overwrite existing files in the output directory",
        ),
    ] = False,
    temperature: Annotated[
        float,
        typer.Option("--temperature", "-t", help="Sampling temperature.", min=0, max=2),
    ] = 0.7,
    # Optional[...] annotations: these defaults are None, so plain `str`/`int`
    # annotations were inaccurate.
    collection: Annotated[
        Optional[str],
        typer.Option(
            "--collection",
            "-c",
            help="If set, will put the translated result into a Chroma DB "
            "collection with the name provided.",
        ),
    ] = None,
    splitter_type: Annotated[
        str,
        typer.Option(
            "-S",
            "--splitter",
            help="Name of custom splitter to use",
            click_type=click.Choice(list(CUSTOM_SPLITTERS.keys())),
        ),
    ] = "file",
    refiner_types: Annotated[
        list[str],
        typer.Option(
            "-r",
            "--refiner",
            # Implicit concatenation instead of a backslash continuation, which
            # embedded source indentation into the user-visible help text.
            help="List of refiner types to use. Add -r for each refiner to use in "
            "refinement chain",
            click_type=click.Choice(list(REFINERS.keys())),
        ),
    ] = ["JanusRefiner"],
    eval_items_per_request: Annotated[
        Optional[int],
        typer.Option(
            "--eval-items-per-request",
            "-rc",
            help="The maximum number of evaluation items per request",
        ),
    ] = None,
    max_tokens: Annotated[
        Optional[int],
        typer.Option(
            "--max-tokens",
            "-M",
            help="The maximum number of tokens the model will take in. "
            "If unspecificed, model's default max will be used.",
        ),
    ] = None,
):
    """Evaluate LLM-generated output (INCOSE requirements or inline comments).

    Builds the evaluator matching ``evaluation_type`` and runs it over every
    file in ``input_dir``, writing results to ``output_dir``.
    """
    model_arguments = dict(temperature=temperature)
    refiner_types = [REFINERS[r] for r in refiner_types]
    kwargs = dict(
        eval_items_per_request=eval_items_per_request,
        model=llm_name,
        model_arguments=model_arguments,
        source_language=language,
        max_prompts=max_prompts,
        max_tokens=max_tokens,
        splitter_type=splitter_type,
        refiner_types=refiner_types,
    )
    # Setting parser type here
    if evaluation_type == "incose":
        evaluator = RequirementEvaluator(**kwargs)
    elif evaluation_type == "comments":
        evaluator = InlineCommentEvaluator(**kwargs)
    else:
        # click.Choice should make this unreachable, but fail loudly rather
        # than with an UnboundLocalError if it ever slips through.
        raise ValueError(f"Unknown evaluation type {evaluation_type}")

    evaluator.translate(input_dir, output_dir, overwrite, collection)
962
-
963
-
964
@db.command("init", help="Connect to or create a database.")
def db_init(
    path: Annotated[
        str, typer.Option("--path", "-p", help="The path to the database file.")
    ] = str(janus_dir / "chroma.db"),
    url: Annotated[
        str,
        typer.Option(
            "--url",
            "-u",
            help="The URL of the database if the database is running externally.",
        ),
    ] = "",
) -> None:
    """Point janus at a Chroma DB instance, creating a local one if needed."""
    global db_loc
    if url != "":
        # An explicit URL takes precedence over the local file path.
        print(f"Pointing to Chroma DB at {url}")
        location = url
    else:
        location = os.path.abspath(path)
        print(f"Setting up Chroma DB at {location}")
    # Persist the chosen location so later commands resolve the same DB.
    with open(db_file, "w") as f:
        f.write(location)
    db_loc = location
    global embedding_db
    embedding_db = ChromaEmbeddingDatabase(db_loc)
992
-
993
-
994
@db.command("status", help="Print current database location.")
def db_status():
    """Report where the Chroma DB pointer currently resolves."""
    print(f"Chroma DB currently pointing to {db_loc}")
997
-
998
-
999
@db.command(
    "ls",
    help="List the current database's collections. Or supply a collection name to list "
    "information about its contents.",
)
def db_ls(
    collection_name: Annotated[
        Optional[str], typer.Argument(help="The name of the collection.")
    ] = None,
    peek: Annotated[
        Optional[int],
        typer.Option("--peek", "-p", help="Peek at N entries for a specific collection."),
    ] = None,
) -> None:
    """List the current database's collections"""
    # Peeking only makes sense for a single, named collection.
    if peek is not None and collection_name is None:
        print(
            "\n[bold red]Cannot peek at all collections. Please specify a "
            "collection by name.[/bold red]"
        )
        return
    database = ChromaEmbeddingDatabase(db_loc)
    for coll in Collections(database).get(collection_name):
        print(
            f"\n[bold underline]Collection[/bold underline]: "
            f"[bold salmon1]{coll.name}[/bold salmon1]"
        )
        print(f" ID: {coll.id}")
        print(f" Metadata: {coll.metadata}")
        print(f" Tenant: [green]{coll.tenant}[/green]")
        print(f" Database: [green]{coll.database}[/green]")
        print(f" Length: {coll.count()}")
        if peek:
            entry = coll.peek(peek)
            # Truncate the (large) embedding vectors for display.
            entry["embeddings"] = entry["embeddings"][0][:2] + ["..."]
            header = (
                " [bold]Peeking at first entry[/bold]:"
                if peek == 1
                else f" [bold]Peeking at first {peek} entries[/bold]:"
            )
            print(header)
            print(entry)
        print()
1042
-
1043
-
1044
@db.command("add", help="Add a collection to the current database.")
def db_add(
    collection_name: Annotated[str, typer.Argument(help="The name of the collection.")],
    model_name: Annotated[str, typer.Argument(help="The name of the embedding model.")],
    input_dir: Annotated[
        str,
        typer.Option(
            "--input",
            "-i",
            help="The directory containing the source code to be added.",
        ),
    ] = "./",
    input_lang: Annotated[
        str, typer.Option("--language", "-l", help="The language of the source code.")
    ] = "python",
    max_tokens: Annotated[
        int,
        typer.Option(
            "--max-tokens",
            "-m",
            help="The maximum number of tokens for each chunk of input source code.",
        ),
    ] = 4096,
) -> None:
    """Add a collection to the database

    Arguments:
        collection_name: The name of the collection to add
        model_name: The name of the embedding model to use
        input_dir: The directory containing the source code to be added
        input_lang: The language of the source code
        max_tokens: The maximum number of tokens for each chunk of input source code
    """
    # TODO: import factory
    console = Console()

    added_to = _check_collection(collection_name, input_dir)
    collections_config = get_collections_config()

    with console.status(
        f"Adding collection: [bold salmon]{collection_name}[/bold salmon]",
        spinner="arrow3",
    ):
        vectorizer_factory = ChromaDBVectorizer()
        vectorizer = vectorizer_factory.create_vectorizer(
            path=db_loc, config=collections_config
        )
        vectorizer.get_or_create_collection(collection_name, model_name=model_name)
        input_dir = Path(input_dir)
        suffix = LANGUAGES[input_lang]["suffix"]
        source_glob = f"**/*.{suffix}"
        input_paths = [p for p in input_dir.rglob(source_glob)]
        # Pick a splitter for the source language. Fall through to the
        # tree-sitter splitter for anything without a dedicated custom
        # splitter; previously a custom-splitter language other than "mumps"
        # or "binary" could leave `splitter` unbound and raise NameError at
        # split time.
        if input_lang == "mumps":
            splitter = MumpsSplitter(
                max_tokens=max_tokens,
            )
        elif input_lang == "binary":
            splitter = BinarySplitter(
                max_tokens=max_tokens,
            )
        else:
            splitter = TreeSitterSplitter(
                language=input_lang,
                max_tokens=max_tokens,
            )
        for input_path in input_paths:
            input_block = splitter.split(input_path)
            vectorizer.add_nodes_recursively(
                input_block,
                collection_name,
                input_path.name,
            )
    # Count every non-directory file so we can report how many were skipped.
    total_files = len([p for p in input_dir.glob("**/*") if not p.is_dir()])
    if added_to:
        print(
            f"\nAdded to [bold salmon1]{collection_name}[/bold salmon1]:\n"
            f"  Embedding Model: [green]{model_name}[/green]\n"
            f"  Input Directory: {input_dir.absolute()}\n"
            f"  {input_lang.capitalize()} [green]*.{suffix}[/green] Files: "
            f"{len(input_paths)}\n"
            "  Other Files (skipped): "
            f"{total_files - len(input_paths)}\n"
        )
        # NOTE: a dead, result-discarding list comprehension over
        # Path.glob(f"**/*.{suffix}") was removed here — it had no effect.
    else:
        print(
            f"\nCreated [bold salmon1]{collection_name}[/bold salmon1]:\n"
            f"  Embedding Model: '{model_name}'\n"
            f"  Input Directory: {input_dir.absolute()}\n"
            f"  {input_lang.capitalize()} [green]*.{suffix}[/green] Files: "
            f"{len(input_paths)}\n"
            "  Other Files (skipped): "
            f"{total_files - len(input_paths)}\n"
        )
    with open(collections_config_file, "w") as f:
        json.dump(vectorizer.config, f, indent=2)
1141
-
1142
-
1143
@db.command(
    "rm",
    help="Remove a collection from the database.",
)
def db_rm(
    collection_name: Annotated[str, typer.Argument(help="The name of the collection.")],
    confirm: Annotated[
        bool,
        typer.Option(
            "--yes",
            "-y",
            help="Confirm the removal of the collection.",
        ),
    ],
) -> None:
    """Remove a collection from the database

    Arguments:
        collection_name: The name of the collection to remove
    """
    # Ask interactively unless the caller already confirmed with --yes.
    delete = confirm or Confirm.ask(
        f"\nAre you sure you want to [bold red]remove[/bold red] "
        f"[bold salmon1]{collection_name}[/bold salmon1]?",
    )
    if not delete:
        raise typer.Abort()
    collections = Collections(ChromaEmbeddingDatabase(db_loc))
    collections.delete(collection_name)
    print(
        f"[bold red]Removed[/bold red] collection "
        f"[bold salmon1]{collection_name}[/bold salmon1]"
    )
1179
-
1180
-
1181
def _check_collection(collection_name: str, input_dir: str | Path) -> bool:
    """Return True if ``collection_name`` already exists in the database.

    The caller uses the result only to phrase its summary ("Added to" vs
    "Created"); interactive confirmation was intentionally disabled.
    """
    collections = Collections(ChromaEmbeddingDatabase(db_loc))
    try:
        collections.get(collection_name)
    except ValueError:
        # The collection does not exist yet; the caller will create it.
        return False
    return True
1198
-
1199
-
1200
@llm.command("add", help="Add a model config to janus")
def llm_add(
    model_name: Annotated[
        str, typer.Argument(help="The user's custom name of the model")
    ],
    model_type: Annotated[
        str,
        typer.Option(
            "--type",
            "-t",
            help="The type of the model",
            click_type=click.Choice(sorted(list(MODEL_TYPE_CONSTRUCTORS.keys()))),
        ),
    ] = "Azure",
):
    """Interactively build a model config and write it to MODEL_CONFIG_DIR.

    Prompts differ per provider; the resulting JSON records the model type,
    its constructor arguments, its token limit, and its per-1k-token cost.

    Raises:
        ValueError: If ``model_type`` is not a recognized provider.
    """
    if not MODEL_CONFIG_DIR.exists():
        MODEL_CONFIG_DIR.mkdir(parents=True)
    model_cfg = MODEL_CONFIG_DIR / f"{model_name}.json"
    if model_type == "HuggingFace":
        url = typer.prompt("Enter the model's URL")
        max_tokens = typer.prompt(
            "Enter the model's maximum tokens", default=4096, type=int
        )
        in_cost = typer.prompt("Enter the cost per input token", default=0, type=float)
        out_cost = typer.prompt("Enter the cost per output token", default=0, type=float)
        params = dict(
            inference_server_url=url,
            max_new_tokens=max_tokens,
            top_k=10,
            top_p=0.95,
            typical_p=0.95,
            temperature=0.01,
            repetition_penalty=1.03,
            timeout=240,
        )
        cfg = {
            "model_type": model_type,
            "model_args": params,
            "token_limit": max_tokens,
            "model_cost": {"input": in_cost, "output": out_cost},
        }
    elif model_type == "HuggingFaceLocal":
        model_id = typer.prompt("Enter the model ID")
        task = typer.prompt("Enter the task")
        max_tokens = typer.prompt(
            "Enter the model's maximum tokens", default=4096, type=int
        )
        # Local models incur no per-token cost.
        in_cost = 0
        out_cost = 0
        params = {"model_id": model_id, "task": task}
        cfg = {
            "model_type": model_type,
            "model_args": params,
            "token_limit": max_tokens,
            "model_cost": {"input": in_cost, "output": out_cost},
        }
    elif model_type == "OpenAI":
        print("DEPRECATED: Use 'Azure' instead. CTRL+C to exit.")
        model_id = typer.prompt(
            "Enter the model ID (list model IDs with `janus llm ls -a`)",
            default="gpt-4o",
            type=click.Choice(openai_models),
            show_choices=False,
        )
        params = dict(
            # FIX: use the prompted OpenAI model ID, not the user's custom
            # alias (`model_name`), which need not be a key of the token/cost
            # tables. This matches the Azure and Bedrock branches below.
            model_name=model_id,
            temperature=0.7,
            n=1,
        )
        max_tokens = TOKEN_LIMITS[model_id]
        model_cost = COST_PER_1K_TOKENS[model_id]
        cfg = {
            "model_type": model_type,
            "model_id": model_id,
            "model_args": params,
            "token_limit": max_tokens,
            "model_cost": model_cost,
        }
    elif model_type == "Azure":
        model_id = typer.prompt(
            "Enter the model ID (list model IDs with `janus llm ls -a`)",
            default="gpt-4o",
            type=click.Choice(azure_models),
            show_choices=False,
        )
        params = dict(
            # Azure uses the "azure_deployment" key for what we're calling "long_model_id"
            azure_deployment=MODEL_ID_TO_LONG_ID[model_id],
            temperature=0.7,
            n=1,
        )
        max_tokens = TOKEN_LIMITS[MODEL_ID_TO_LONG_ID[model_id]]
        model_cost = COST_PER_1K_TOKENS[MODEL_ID_TO_LONG_ID[model_id]]
        cfg = {
            "model_type": model_type,
            "model_id": model_id,
            "model_args": params,
            "token_limit": max_tokens,
            "model_cost": model_cost,
        }
    elif model_type == "BedrockChat" or model_type == "Bedrock":
        model_id = typer.prompt(
            "Enter the model ID (list model IDs with `janus llm ls -a`)",
            default="bedrock-claude-sonnet",
            type=click.Choice(bedrock_models),
            show_choices=False,
        )
        params = dict(
            # Bedrock uses the "model_id" key for what we're calling "long_model_id"
            model_id=MODEL_ID_TO_LONG_ID[model_id],
            model_kwargs={"temperature": 0.7},
        )
        max_tokens = TOKEN_LIMITS[MODEL_ID_TO_LONG_ID[model_id]]
        model_cost = COST_PER_1K_TOKENS[MODEL_ID_TO_LONG_ID[model_id]]
        cfg = {
            "model_type": model_type,
            "model_id": model_id,
            "model_args": params,
            "token_limit": max_tokens,
            "model_cost": model_cost,
        }
    else:
        raise ValueError(f"Unknown model type {model_type}")
    with open(model_cfg, "w") as f:
        json.dump(cfg, f, indent=2)
    print(f"Model config written to {model_cfg}")
1326
-
1327
-
1328
@llm.command("ls", help="List all of the user-configured models")
def llm_ls(
    all: Annotated[
        bool,
        typer.Option(
            "--all",
            "-a",
            is_flag=True,
            help="List all models, including the default model IDs.",
            # FIX: removed a nonsensical click_type=click.Choice(...) that was
            # copy-pasted from llm_add's --type option onto this boolean flag.
        ),
    ] = False,
):
    """List user-configured models, optionally with the built-in model IDs."""
    print("\n[green]User-configured models[/green]:")
    for model_cfg in MODEL_CONFIG_DIR.glob("*.json"):
        with open(model_cfg, "r") as f:
            cfg = json.load(f)
        print(f"\t[blue]{model_cfg.stem}[/blue]: [purple]{cfg['model_type']}[/purple]")

    if all:
        print("\n[green]Available model IDs[/green]:")
        for model_id, model_type in MODEL_TYPES.items():
            print(f"\t[blue]{model_id}[/blue]: [purple]{model_type}[/purple]")
1351
-
1352
-
1353
@embedding.command("add", help="Add an embedding model config to janus")
def embedding_add(
    model_name: Annotated[
        str, typer.Argument(help="The user's custom name for the model")
    ],
    model_type: Annotated[
        str,
        typer.Option(
            "--type",
            "-t",
            help="The type of the model",
            click_type=click.Choice(list(val.value for val in EmbeddingModelType)),
        ),
    ] = "OpenAI",
):
    """Interactively collect an embedding-model config and write it to disk."""
    if not EMBEDDING_MODEL_CONFIG_DIR.exists():
        EMBEDDING_MODEL_CONFIG_DIR.mkdir(parents=True)
    model_cfg = EMBEDDING_MODEL_CONFIG_DIR / f"{model_name}.json"
    if model_type in EmbeddingModelType.HuggingFaceInferenceAPI.values:
        # Remote HuggingFace inference endpoint: needs URL, name, key, costs.
        hf = typer.style("HuggingFaceInferenceAPI", fg="yellow")
        url = typer.prompt(f"Enter the {hf} model's URL", type=str, value_proc=AnyHttpUrl)
        api_model_name = typer.prompt("Enter the model's name", type=str, default="")
        api_key = typer.prompt("Enter the API key", type=str, default="")
        max_tokens = typer.prompt(
            "Enter the model's maximum tokens", default=8191, type=int
        )
        in_cost = typer.prompt("Enter the cost per input token", default=0, type=float)
        out_cost = typer.prompt("Enter the cost per output token", default=0, type=float)
        cfg = {
            "model_type": model_type,
            "model_identifier": str(url),
            "model_args": dict(
                model_name=api_model_name,
                api_key=api_key,
            ),
            "token_limit": max_tokens,
            "model_cost": {"input": in_cost, "output": out_cost},
        }
    elif model_type in EmbeddingModelType.HuggingFaceLocal.values:
        # Local HuggingFace model: downloaded into a cache folder, no cost.
        hf = typer.style("HuggingFace", fg="yellow")
        model_id = typer.prompt(
            f"Enter the {hf} model ID",
            default="sentence-transformers/all-MiniLM-L6-v2",
            type=str,
        )
        cache_folder = str(
            Path(
                typer.prompt(
                    "Enter the model's cache folder",
                    default=EMBEDDING_MODEL_CONFIG_DIR / "cache",
                    type=str,
                )
            )
        )
        max_tokens = typer.prompt(
            "Enter the model's maximum tokens", default=8191, type=int
        )
        cfg = {
            "model_type": model_type,
            "model_identifier": model_id,
            "model_args": dict(
                cache_folder=str(cache_folder),
            ),
            "token_limit": max_tokens,
            "model_cost": {"input": 0, "output": 0},
        }
    elif model_type in EmbeddingModelType.OpenAI.values:
        # OpenAI embedding model: limits and costs come from lookup tables.
        available_models = list(EMBEDDING_COST_PER_MODEL.keys())

        open_ai = typer.style("OpenAI", fg="green")
        prompt = f"Enter the {open_ai} model name"

        model_name = typer.prompt(
            prompt,
            default="text-embedding-3-small",
            type=click.types.Choice(available_models),
            show_choices=False,
        )
        cfg = {
            "model_type": model_type,
            "model_identifier": model_name,
            "model_args": dict(
                model=model_name,
            ),
            "token_limit": EMBEDDING_TOKEN_LIMITS[model_name],
            "model_cost": EMBEDDING_COST_PER_MODEL[model_name],
        }
    else:
        raise ValueError(f"Unknown model type {model_type}")
    with open(model_cfg, "w") as f:
        json.dump(cfg, f, indent=2)
    print(f"Model config written to {model_cfg}")
1450
-
1451
-
1452
# Register the sub-command groups on the main Typer app.
for _sub_app, _sub_name in (
    (db, "db"),
    (llm, "llm"),
    (evaluate, "evaluate"),
    (embedding, "embedding"),
):
    app.add_typer(_sub_app, name=_sub_name)
1456
-
1457
-
1458
@app.command()
def render(
    input_dir: Annotated[
        str,
        typer.Option(
            "--input",
            "-i",
        ),
    ],
    output_dir: Annotated[str, typer.Option("--output", "-o")],
):
    """Render PlantUML text from janus JSON outputs into diagram images.

    For every ``*.json`` under ``input_dir``, the ``output`` field is
    unescaped, written to the mirrored ``.txt`` path under ``output_dir``,
    rendered with the bundled plantuml.jar, and the intermediate ``.txt``
    file is then removed.
    """
    input_dir = Path(input_dir)
    output_dir = Path(output_dir)
    # Loop-invariant: resolve the PlantUML jar once, not per file.
    jar_path = homedir / ".janus/lib/plantuml.jar"
    for input_file in input_dir.rglob("*.json"):
        with open(input_file, "r") as f:
            data = json.load(f)

        output_file = output_dir / input_file.relative_to(input_dir).with_suffix(".txt")
        # FIX: parents=True handles mirrored paths nested more than one level
        # deep (bare mkdir() raised FileNotFoundError); exist_ok avoids the
        # exists()/mkdir() race.
        output_file.parent.mkdir(parents=True, exist_ok=True)

        text = data["output"].replace("\\n", "\n").strip()
        output_file.write_text(text)

        subprocess.run(["java", "-jar", jar_path, output_file])  # nosec
        output_file.unlink()
1485
-
1486
-
1487
if __name__ == "__main__":
    # Allow running this module directly as the janus CLI entry point.
    app()