cat-llm 0.0.27__py3-none-any.whl → 0.0.28__py3-none-any.whl

This diff shows the changes between two publicly released versions of the package as they appear in their public registry. It is provided for informational purposes only.
cat_llm-0.0.27.dist-info/METADATA → cat_llm-0.0.28.dist-info/METADATA RENAMED
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: cat-llm
-Version: 0.0.27
+Version: 0.0.28
 Summary: A tool for categorizing text data and images using LLMs and vision models
 Project-URL: Documentation, https://github.com/chrissoria/cat-llm#readme
 Project-URL: Issues, https://github.com/chrissoria/cat-llm/issues
cat_llm-0.0.28.dist-info/RECORD ADDED
@@ -0,0 +1,9 @@
+catllm/CERAD_functions.py,sha256=mtHxshRWmWXMH9kkkCfbMHXgDe00EVabjFiN8s73LPI,16935
+catllm/__about__.py,sha256=ZBz_2FX253RxgXFq-1v4qkfIEZi38fNzs_Rp2e3ZdCo,404
+catllm/__init__.py,sha256=kLk180aJna1s-wU6CLr4_hKkbjoeET-11jGmC1pdhQw,330
+catllm/cat_llm.py,sha256=Rwyz93caNf0h9tfurObY6qDjtG6EKaYXR0GrVW7h2kU,16920
+catllm/image_functions.py,sha256=JLlv5qQhAQzgsRIY18rUPtM1P7x1Fw2UlWlI1dpv3dA,31272
+cat_llm-0.0.28.dist-info/METADATA,sha256=zcHC8uPOLGIr9GOeq1Qyf04WebFdYEY5p4f8ZoZAwHg,1679
+cat_llm-0.0.28.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+cat_llm-0.0.28.dist-info/licenses/LICENSE,sha256=wJLsvOr6lrFUDcoPXExa01HOKFWrS3JC9f0RudRw8uw,1075
+cat_llm-0.0.28.dist-info/RECORD,,
catllm/__about__.py CHANGED
@@ -1,7 +1,7 @@
 # SPDX-FileCopyrightText: 2025-present Christopher Soria <chrissoria@berkeley.edu>
 #
 # SPDX-License-Identifier: MIT
-__version__ = "0.0.27"
+__version__ = "0.0.28"
 __author__ = "Chris Soria"
 __email__ = "chrissoria@berkeley.edu"
 __title__ = "cat-llm"
catllm/image_functions.py CHANGED
@@ -1,5 +1,5 @@
 # image multi-class (binary) function
-def extract_image_multi_class(
+def image_multi_class(
     image_description,
     image_input,
     categories,
@@ -96,7 +96,7 @@ def extract_image_multi_class(
                 },
             ]

-        if model_source == "Anthropic":
+        elif model_source == "Anthropic":
             encoded_image = f"data:image/{ext};base64,{encoded}"
             prompt = [
                 {"type": "text",
@@ -171,7 +171,7 @@ def extract_image_multi_class(
                 print(f"An error occurred: {e}")
                 link1.append(f"Error processing input: {e}")
         else:
-            raise ValueError("Unknown source! Choose from OpenAI, Anthropic, Perplexity, or Mistral")
+            raise ValueError("Unknown source! Choose from OpenAI, Anthropic, or Mistral")
         # in situation that no JSON is found
         if reply is not None:
             extracted_json = regex.findall(r'\{(?:[^{}]|(?R))*\}', reply, regex.DOTALL)
@@ -240,7 +240,7 @@ def extract_image_multi_class(
     return categorized_data

 #image score function
-def extract_image_score(
+def image_score(
     reference_image_description,
     image_input,
     reference_image,
@@ -288,7 +288,8 @@ def extract_image_score(
         print(f"Provided a list of {len(image_input)} images.")

     with open(reference_image, 'rb') as f:
-        reference_image = f"data:image/{reference_image.split('.')[-1]};base64,{base64.b64encode(f.read()).decode('utf-8')}"
+        reference = base64.b64encode(f.read()).decode('utf-8')
+        reference_image = f"data:image/{reference_image.split('.')[-1]};base64,{reference}"

     link1 = []
     extracted_jsons = []
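The hunk above splits the reference-image encoding into two steps so the bare base64 string (reference) stays available alongside the data URL: OpenAI-style image_url content takes a data: URL, while the Anthropic image blocks added below take raw base64 in source.data. A standalone sketch of the pattern, with an illustrative file name:

import base64

path = "reference_clock.png"  # illustrative path, not from the diff
with open(path, "rb") as f:
    reference = base64.b64encode(f.read()).decode("utf-8")  # bare base64, reusable as Anthropic "source.data"
reference_image = f"data:image/{path.split('.')[-1]};base64,{reference}"  # data URL for OpenAI "image_url.url"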
@@ -308,40 +309,87 @@ def extract_image_score(
         ext = Path(img_path).suffix.lstrip(".").lower()
         encoded_image = f"data:image/{ext};base64,{encoded}"

-        prompt = [
-            {
-                "type": "text",
-                "text": (
-                    f"You are a visual similarity assessment system.\n"
-                    f"Task Compare these two images:\n"
-                    f"1. REFERENCE (left): {reference_image_description}\n"
-                    f"2. INPUT (right): User-provided drawing\n\n"
-                    f"Rating criteria:\n"
-                    f"1: No meaningful similarity (fundamentally different)\n"
-                    f"2: Barely recognizable similarity (25% match)\n"
-                    f"3: Partial match (50% key features)\n"
-                    f"4: Strong alignment (75% features)\n"
-                    f"5: Near-perfect match (90%+ similarity)\n\n"
-                    f"Output format Return ONLY:\n"
-                    "{\n"
-                    ' "score": [1-5],\n'
-                    ' "summary": "reason you scored"\n'
-                    "}\n\n"
-                    f"Critical rules:\n"
-                    f"- Score must reflect shape, proportions, and key details\n"
-                    f"- List only concrete matching elements from reference\n"
-                    f"- No markdown or additional text"
-                ),
-            },
-            {"type": "image_url",
-             "image_url": {"url": reference_image, "detail": "high"}
-             },
-            {
-                "type": "image_url",
-
-                "image_url": {"url": encoded_image, "detail": "high"},
-            },
-        ]
+        if model_source == "OpenAI":
+            prompt = [
+                {
+                    "type": "text",
+                    "text": (
+                        f"You are a visual similarity assessment system.\n"
+                        f"Task Compare these two images:\n"
+                        f"1. REFERENCE (left): {reference_image_description}\n"
+                        f"2. INPUT (right): User-provided drawing\n\n"
+                        f"Rating criteria:\n"
+                        f"1: No meaningful similarity (fundamentally different)\n"
+                        f"2: Barely recognizable similarity (25% match)\n"
+                        f"3: Partial match (50% key features)\n"
+                        f"4: Strong alignment (75% features)\n"
+                        f"5: Near-perfect match (90%+ similarity)\n\n"
+                        f"Output format ► Return ONLY:\n"
+                        "{\n"
+                        ' "score": [1-5],\n'
+                        ' "summary": "reason you scored"\n'
+                        "}\n\n"
+                        f"Critical rules:\n"
+                        f"- Score must reflect shape, proportions, and key details\n"
+                        f"- List only concrete matching elements from reference\n"
+                        f"- No markdown or additional text"
+                    )
+                },
+                {
+                    "type": "image_url",
+                    "image_url": {"url": reference_image, "detail": "high"}
+                },
+                {
+                    "type": "image_url",
+                    "image_url": {"url": encoded_image, "detail": "high"}
+                }
+            ]
+
+        elif model_source == "Anthropic":  # Changed to elif
+            prompt = [
+                {
+                    "type": "text",
+                    "text": (
+                        f"You are a visual similarity assessment system.\n"
+                        f"Task ► Compare these two images:\n"
+                        f"1. REFERENCE (left): {reference_image_description}\n"
+                        f"2. INPUT (right): User-provided drawing\n\n"
+                        f"Rating criteria:\n"
+                        f"1: No meaningful similarity (fundamentally different)\n"
+                        f"2: Barely recognizable similarity (25% match)\n"
+                        f"3: Partial match (50% key features)\n"
+                        f"4: Strong alignment (75% features)\n"
+                        f"5: Near-perfect match (90%+ similarity)\n\n"
+                        f"Output format ► Return ONLY:\n"
+                        "{\n"
+                        ' "score": [1-5],\n'
+                        ' "summary": "reason you scored"\n'
+                        "}\n\n"
+                        f"Critical rules:\n"
+                        f"- Score must reflect shape, proportions, and key details\n"
+                        f"- List only concrete matching elements from reference\n"
+                        f"- No markdown or additional text"
+                    )
+                },
+                {
+                    "type": "image",  # Added missing type
+                    "source": {
+                        "type": "base64",
+                        "media_type": "image/png",
+                        "data": reference
+                    }
+                },
+                {
+                    "type": "image",  # Added missing type
+                    "source": {
+                        "type": "base64",
+                        "media_type": "image/jpeg",
+                        "data": encoded
+                    }
+                }
+            ]
+
+
         if model_source == "OpenAI":
             from openai import OpenAI
             client = OpenAI(api_key=api_key)
@@ -357,20 +405,6 @@ def extract_image_score(
                 print(f"An error occurred: {e}")
                 link1.append(f"Error processing input: {e}")

-        elif model_source == "Perplexity":
-            from openai import OpenAI
-            client = OpenAI(api_key=api_key, base_url="https://api.perplexity.ai")
-            try:
-                response_obj = client.chat.completions.create(
-                    model=user_model,
-                    messages=[{'role': 'user', 'content': prompt}],
-                    temperature=creativity
-                )
-                reply = response_obj.choices[0].message.content
-                link1.append(reply)
-            except Exception as e:
-                print(f"An error occurred: {e}")
-                link1.append(f"Error processing input: {e}")
         elif model_source == "Anthropic":
             import anthropic
             client = anthropic.Anthropic(api_key=api_key)
@@ -386,6 +420,7 @@ def extract_image_score(
             except Exception as e:
                 print(f"An error occurred: {e}")
                 link1.append(f"Error processing input: {e}")
+
         elif model_source == "Mistral":
             from mistralai import Mistral
             client = Mistral(api_key=api_key)
@@ -468,7 +503,7 @@ def extract_image_score(
     return categorized_data

 # image features function
-def extract_image_features(
+def image_features(
     image_description,
     image_input,
     features_to_extract,
@@ -530,41 +565,80 @@ def extract_image_features(

     for i, img_path in enumerate(
             tqdm(image_files, desc="Categorising images"), start=0):
+        if img_path is None or not os.path.exists(img_path):
+            link1.append("Skipped NaN input or invalid path")
+            extracted_jsons.append("""{"no_valid_image": 1}""")
+            continue  # Skip the rest of the loop iteration
         # encode this specific image once
         with open(img_path, "rb") as f:
             encoded = base64.b64encode(f.read()).decode("utf-8")
         ext = Path(img_path).suffix.lstrip(".").lower()
         encoded_image = f"data:image/{ext};base64,{encoded}"

-        prompt = [
-            {
-                "type": "text",
-                "text": (
-                    f"You are a visual question answering assistant.\n"
-                    f"Task Analyze the attached image and answer these specific questions:\n\n"
-                    f"Image context: {image_description}\n\n"
-                    f"Questions to answer:\n{categories_str}\n\n"
-                    f"Output format ► Return **only** a JSON object where:\n"
-                    f"- Keys are question numbers ('1', '2', ...)\n"
-                    f"- Values are concise answers (numbers, short phrases)\n\n"
-                    f"Example for 3 questions:\n"
-                    "{\n"
-                    ' "1": "4",\n'
-                    ' "2": "blue",\n'
-                    ' "3": "yes"\n'
-                    "}\n\n"
-                    f"Important rules:\n"
-                    f"1. Answer directly - no explanations\n"
-                    f"2. Use exact numerical values when possible\n"
-                    f"3. For yes/no questions, use 'yes' or 'no'\n"
-                    f"4. Never add extra keys or formatting"
-                ),
-            },
-            {
-                "type": "image_url",
-                "image_url": {"url": encoded_image, "detail": "high"},
-            },
-        ]
+        if model_source == "OpenAI":
+            prompt = [
+                {
+                    "type": "text",
+                    "text": (
+                        f"You are a visual question answering assistant.\n"
+                        f"Task Analyze the attached image and answer these specific questions:\n\n"
+                        f"Image context: {image_description}\n\n"
+                        f"Questions to answer:\n{categories_str}\n\n"
+                        f"Output format Return **only** a JSON object where:\n"
+                        f"- Keys are question numbers ('1', '2', ...)\n"
+                        f"- Values are concise answers (numbers, short phrases)\n\n"
+                        f"Example for 3 questions:\n"
+                        "{\n"
+                        ' "1": "4",\n'
+                        ' "2": "blue",\n'
+                        ' "3": "yes"\n'
+                        "}\n\n"
+                        f"Important rules:\n"
+                        f"1. Answer directly - no explanations\n"
+                        f"2. Use exact numerical values when possible\n"
+                        f"3. For yes/no questions, use 'yes' or 'no'\n"
+                        f"4. Never add extra keys or formatting"
+                    ),
+                },
+                {
+                    "type": "image_url",
+                    "image_url": {"url": encoded_image, "detail": "high"},
+                },
+            ]
+        elif model_source == "Anthropic":
+            prompt = [
+                {
+                    "type": "text",
+                    "text": (
+                        f"You are a visual question answering assistant.\n"
+                        f"Task ► Analyze the attached image and answer these specific questions:\n\n"
+                        f"Image context: {image_description}\n\n"
+                        f"Questions to answer:\n{categories_str}\n\n"
+                        f"Output format ► Return **only** a JSON object where:\n"
+                        f"- Keys are question numbers ('1', '2', ...)\n"
+                        f"- Values are concise answers (numbers, short phrases)\n\n"
+                        f"Example for 3 questions:\n"
+                        "{\n"
+                        ' "1": "4",\n'
+                        ' "2": "blue",\n'
+                        ' "3": "yes"\n'
+                        "}\n\n"
+                        f"Important rules:\n"
+                        f"1. Answer directly - no explanations\n"
+                        f"2. Use exact numerical values when possible\n"
+                        f"3. For yes/no questions, use 'yes' or 'no'\n"
+                        f"4. Never add extra keys or formatting"
+                    )
+                },
+                {
+                    "type": "image",
+                    "source": {
+                        "type": "base64",
+                        "media_type": "image/jpeg",
+                        "data": encoded
+                    }
+                }
+            ]
         if model_source == "OpenAI":
             from openai import OpenAI
             client = OpenAI(api_key=api_key)
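In sum, 0.0.28 renames the public entry points in image_functions.py (extract_image_multi_class → image_multi_class, extract_image_score → image_score, extract_image_features → image_features), removes Perplexity from the accepted model_source values, builds provider-specific prompt payloads for OpenAI and Anthropic, and (in image_features) skips missing image paths instead of failing. A minimal calling sketch against the new names follows; the argument values, and the assumption that api_key, user_model, and creativity are keyword parameters of image_score, are illustrative rather than taken from the diff:

# Sketch under assumptions: parameter names match variables visible in
# the diff; the values and the exact signature are illustrative guesses.
from catllm.image_functions import image_score

results = image_score(
    reference_image_description="a clock face reading ten past eleven",
    image_input=["drawing1.png", "drawing2.png"],  # paths to drawings to score
    reference_image="reference_clock.png",
    model_source="Anthropic",  # 0.0.28 accepts OpenAI, Anthropic, or Mistral
    user_model="claude-3-5-sonnet-latest",  # hypothetical model id
    api_key="YOUR_API_KEY",
    creativity=0,  # forwarded as the sampling temperature in the diff
)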
cat_llm-0.0.27.dist-info/RECORD DELETED
@@ -1,9 +0,0 @@
-catllm/CERAD_functions.py,sha256=mtHxshRWmWXMH9kkkCfbMHXgDe00EVabjFiN8s73LPI,16935
-catllm/__about__.py,sha256=H3dYrI6XpHXpRmgCCiw8u2dIaFZWRsw7RxfRy_aIlaQ,404
-catllm/__init__.py,sha256=kLk180aJna1s-wU6CLr4_hKkbjoeET-11jGmC1pdhQw,330
-catllm/cat_llm.py,sha256=Rwyz93caNf0h9tfurObY6qDjtG6EKaYXR0GrVW7h2kU,16920
-catllm/image_functions.py,sha256=rMa7Jb565Rp75pbRKYF8Sqk_Uwuv60olMU0Mbvbq55s,27440
-cat_llm-0.0.27.dist-info/METADATA,sha256=ocT3Y5NoA9csBGpSkg0G_PCPPhbm_EgWiNicpf9Xf-I,1679
-cat_llm-0.0.27.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-cat_llm-0.0.27.dist-info/licenses/LICENSE,sha256=wJLsvOr6lrFUDcoPXExa01HOKFWrS3JC9f0RudRw8uw,1075
-cat_llm-0.0.27.dist-info/RECORD,,