cat-llm 0.0.27__py3-none-any.whl → 0.0.29__py3-none-any.whl
This diff shows the content of publicly available package versions released to a supported registry. It is provided for informational purposes only and reflects the changes between the two versions as they appear in the public registry.
- {cat_llm-0.0.27.dist-info → cat_llm-0.0.29.dist-info}/METADATA +1 -1
- cat_llm-0.0.29.dist-info/RECORD +9 -0
- catllm/CERAD_functions.py +50 -22
- catllm/__about__.py +1 -1
- catllm/cat_llm.py +2 -3
- catllm/image_functions.py +157 -83
- cat_llm-0.0.27.dist-info/RECORD +0 -9
- {cat_llm-0.0.27.dist-info → cat_llm-0.0.29.dist-info}/WHEEL +0 -0
- {cat_llm-0.0.27.dist-info → cat_llm-0.0.29.dist-info}/licenses/LICENSE +0 -0
{cat_llm-0.0.27.dist-info → cat_llm-0.0.29.dist-info}/METADATA
CHANGED

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: cat-llm
-Version: 0.0.27
+Version: 0.0.29
 Summary: A tool for categorizing text data and images using LLMs and vision models
 Project-URL: Documentation, https://github.com/chrissoria/cat-llm#readme
 Project-URL: Issues, https://github.com/chrissoria/cat-llm/issues
cat_llm-0.0.29.dist-info/RECORD
ADDED

@@ -0,0 +1,9 @@
+catllm/CERAD_functions.py,sha256=KaKrtw71VGNzWBRv7B_dMwGT6iYg3D7G5l5nUFKImMw,18332
+catllm/__about__.py,sha256=QnNiB46oNOtCa5XpK0snsSnXws0EtbKwFamcLpxgaIk,404
+catllm/__init__.py,sha256=kLk180aJna1s-wU6CLr4_hKkbjoeET-11jGmC1pdhQw,330
+catllm/cat_llm.py,sha256=TNsjYKpr8ZH9jeAYN-4DcFcrnR8x2eRl99oXzpdhE0Q,16910
+catllm/image_functions.py,sha256=JLlv5qQhAQzgsRIY18rUPtM1P7x1Fw2UlWlI1dpv3dA,31272
+cat_llm-0.0.29.dist-info/METADATA,sha256=CPxmYv0wGD7HMY-rMyNa3wYR6sZ7d1Okg2SWJaqAHa0,1679
+cat_llm-0.0.29.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+cat_llm-0.0.29.dist-info/licenses/LICENSE,sha256=wJLsvOr6lrFUDcoPXExa01HOKFWrS3JC9f0RudRw8uw,1075
+cat_llm-0.0.29.dist-info/RECORD,,
catllm/CERAD_functions.py
CHANGED
@@ -130,28 +130,56 @@ def cerad_drawn_score(
         reference_text = f"This image contains a perfect reference image of a {shape}. Next to is a drawing that is meant to be similar to the reference {shape}.\n\n"
     else:
         reference_text = f"Image is expected to show within it a drawing of a {shape}.\n\n"
-    [22 removed lines (old 133-154) are not rendered in this diff view]
+
+    if model_source == "OpenAI":
+        prompt = [
+            {
+                "type": "text",
+                "text": (
+                    f"You are an image-tagging assistant trained in the CERAD Constructional Praxis test.\n"
+                    f"Task ► Examine the attached image and decide, **for each category below**, "
+                    f"whether it is PRESENT (1) or NOT PRESENT (0).\n\n"
+                    f"{reference_text}"
+                    f"Categories:\n{categories_str}\n\n"
+                    f"Output format ► Respond with **only** a JSON object whose keys are the "
+                    f"quoted category numbers ('1', '2', …) and whose values are 1 or 0. "
+                    f"No additional keys, comments, or text.\n\n"
+                    f"Example:\n"
+                    f"{example_JSON}"
+                ),
+            },
+            {
+                "type": "image_url",
+                "image_url": {"url": encoded_image, "detail": "high"},
+            },
+        ]
+    elif model_source == "Anthropic":
+        prompt = [
+            {
+                "type": "text",
+                "text": (
+                    f"You are an image-tagging assistant trained in the CERAD Constructional Praxis test.\n"
+                    f"Task ► Examine the attached image and decide, **for each category below**, "
+                    f"whether it is PRESENT (1) or NOT PRESENT (0).\n\n"
+                    f"{reference_text}"
+                    f"Categories:\n{categories_str}\n\n"
+                    f"Output format ► Respond with **only** a JSON object whose keys are the "
+                    f"quoted category numbers ('1', '2', …) and whose values are 1 or 0. "
+                    f"No additional keys, comments, or text.\n\n"
+                    f"Example:\n"
+                    f"{example_JSON}"
+                ),
+            },
+            {
+                "type": "image",
+                "source": {
+                    "type": "base64",
+                    "media_type": "image/jpeg",
+                    "data": encoded
+                }
+            },
+        ]
+
     if model_source == "OpenAI":
         from openai import OpenAI
         client = OpenAI(api_key=api_key)
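The new branches above build the same text prompt for both providers but attach the image differently: the OpenAI-style payload uses an image_url content part carrying a data URL, while the Anthropic-style payload uses an image part with a base64 source block. A minimal self-contained sketch of the two payload shapes, with an illustrative file path that is not taken from the package:

    import base64

    # Hypothetical input image, for illustration only.
    with open("drawing.jpg", "rb") as f:
        encoded = base64.b64encode(f.read()).decode("utf-8")

    # OpenAI-style content part: the image travels as a data URL.
    openai_part = {
        "type": "image_url",
        "image_url": {"url": f"data:image/jpeg;base64,{encoded}", "detail": "high"},
    }

    # Anthropic-style content part: the image travels as a raw base64 source block.
    anthropic_part = {
        "type": "image",
        "source": {"type": "base64", "media_type": "image/jpeg", "data": encoded},
    }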
catllm/__about__.py
CHANGED
catllm/cat_llm.py
CHANGED
@@ -219,7 +219,7 @@ Return the top {top_n} categories as a numbered list sorted from the most to lea
     return top_categories_final
 
 #multi-class text classification
-def
+def multi_class(
     survey_question,
     survey_input,
     categories,

@@ -391,5 +391,4 @@ Provide your work in JSON format where the number belonging to each category is
     save_directory = os.getcwd()
     categorized_data.to_csv(os.path.join(save_directory, filename), index=False)
 
-    return categorized_data
-
+    return categorized_data
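The functional change here is that the classifier entry point (its old name is truncated in this view) is now exported as multi_class, and the stray blank line after the final return was dropped. A hedged usage sketch, assuming only the first three parameter names shown in the diff; any other arguments are not confirmed by this view:

    # Illustrative only: the full signature (model, api_key, etc.) is not shown here.
    from catllm.cat_llm import multi_class

    categorized = multi_class(
        survey_question="What did you like most about the course?",
        survey_input=["The pacing was great", "Too much homework"],
        categories=["pacing", "workload", "instructor"],
        # ...plus whatever model / API key arguments the full signature requires
    )
    # Per the hunk above, the function writes a CSV and returns categorized_data.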
catllm/image_functions.py
CHANGED
@@ -1,5 +1,5 @@
 # image multi-class (binary) function
-def extract_image_multi_class(
+def image_multi_class(
     image_description,
     image_input,
     categories,
@@ -96,7 +96,7 @@ def extract_image_multi_class(
                },
            ]
 
-       [1 removed line (old 99) is not rendered in this diff view]
+        elif model_source == "Anthropic":
            encoded_image = f"data:image/{ext};base64,{encoded}"
            prompt = [
                {"type": "text",
|
|
|
171
171
|
print(f"An error occurred: {e}")
|
|
172
172
|
link1.append(f"Error processing input: {e}")
|
|
173
173
|
else:
|
|
174
|
-
raise ValueError("Unknown source! Choose from OpenAI, Anthropic,
|
|
174
|
+
raise ValueError("Unknown source! Choose from OpenAI, Anthropic, or Mistral")
|
|
175
175
|
# in situation that no JSON is found
|
|
176
176
|
if reply is not None:
|
|
177
177
|
extracted_json = regex.findall(r'\{(?:[^{}]|(?R))*\}', reply, regex.DOTALL)
|
|
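The regex.findall call in the context above uses the third-party regex module's recursive construct (?R) to pull balanced {...} blocks out of a free-form model reply when the model wraps its JSON in extra prose. A small self-contained sketch of that fallback parsing step, with a made-up reply string:

    import json
    import regex  # third-party module; supports the recursive (?R) construct

    reply = 'Sure! Here is the result:\n{"1": 1, "2": 0}\nLet me know if you need more.'

    # Find every balanced {...} block, even with surrounding prose.
    candidates = regex.findall(r'\{(?:[^{}]|(?R))*\}', reply, regex.DOTALL)

    parsed = json.loads(candidates[0]) if candidates else {}
    print(parsed)  # {'1': 1, '2': 0}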
@@ -240,7 +240,7 @@ def extract_image_multi_class(
    return categorized_data
 
 #image score function
-def extract_image_score(
+def image_score(
    reference_image_description,
    image_input,
    reference_image,
@@ -288,7 +288,8 @@ def extract_image_score(
        print(f"Provided a list of {len(image_input)} images.")
 
    with open(reference_image, 'rb') as f:
-       [1 removed line (old 291) is not rendered in this diff view]
+        reference = base64.b64encode(f.read()).decode('utf-8')
+    reference_image = f"data:image/{reference_image.split('.')[-1]};base64,{reference}"
 
    link1 = []
    extracted_jsons = []
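The added lines put the reference image into the same data:image/...;base64,... URL form used for the per-item images, so both can be attached to an OpenAI-style message. A standalone sketch of that encoding step, with an illustrative file name:

    import base64

    reference_path = "reference_circle.png"  # illustrative path

    with open(reference_path, "rb") as f:
        reference = base64.b64encode(f.read()).decode("utf-8")

    # Derive the extension from the file name and build a data URL that an
    # OpenAI-style "image_url" content part can consume directly.
    reference_url = f"data:image/{reference_path.split('.')[-1]};base64,{reference}"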
@@ -308,40 +309,87 @@ def extract_image_score(
        ext = Path(img_path).suffix.lstrip(".").lower()
        encoded_image = f"data:image/{ext};base64,{encoded}"
 
-       [34 removed lines (old 311-344) are not rendered in this diff view]
+        if model_source == "OpenAI":
+            prompt = [
+                {
+                    "type": "text",
+                    "text": (
+                        f"You are a visual similarity assessment system.\n"
+                        f"Task ► Compare these two images:\n"
+                        f"1. REFERENCE (left): {reference_image_description}\n"
+                        f"2. INPUT (right): User-provided drawing\n\n"
+                        f"Rating criteria:\n"
+                        f"1: No meaningful similarity (fundamentally different)\n"
+                        f"2: Barely recognizable similarity (25% match)\n"
+                        f"3: Partial match (50% key features)\n"
+                        f"4: Strong alignment (75% features)\n"
+                        f"5: Near-perfect match (90%+ similarity)\n\n"
+                        f"Output format ► Return ONLY:\n"
+                        "{\n"
+                        ' "score": [1-5],\n'
+                        ' "summary": "reason you scored"\n'
+                        "}\n\n"
+                        f"Critical rules:\n"
+                        f"- Score must reflect shape, proportions, and key details\n"
+                        f"- List only concrete matching elements from reference\n"
+                        f"- No markdown or additional text"
+                    )
+                },
+                {
+                    "type": "image_url",
+                    "image_url": {"url": reference_image, "detail": "high"}
+                },
+                {
+                    "type": "image_url",
+                    "image_url": {"url": encoded_image, "detail": "high"}
+                }
+            ]
+
+        elif model_source == "Anthropic":  # Changed to elif
+            prompt = [
+                {
+                    "type": "text",
+                    "text": (
+                        f"You are a visual similarity assessment system.\n"
+                        f"Task ► Compare these two images:\n"
+                        f"1. REFERENCE (left): {reference_image_description}\n"
+                        f"2. INPUT (right): User-provided drawing\n\n"
+                        f"Rating criteria:\n"
+                        f"1: No meaningful similarity (fundamentally different)\n"
+                        f"2: Barely recognizable similarity (25% match)\n"
+                        f"3: Partial match (50% key features)\n"
+                        f"4: Strong alignment (75% features)\n"
+                        f"5: Near-perfect match (90%+ similarity)\n\n"
+                        f"Output format ► Return ONLY:\n"
+                        "{\n"
+                        ' "score": [1-5],\n'
+                        ' "summary": "reason you scored"\n'
+                        "}\n\n"
+                        f"Critical rules:\n"
+                        f"- Score must reflect shape, proportions, and key details\n"
+                        f"- List only concrete matching elements from reference\n"
+                        f"- No markdown or additional text"
+                    )
+                },
+                {
+                    "type": "image",  # Added missing type
+                    "source": {
+                        "type": "base64",
+                        "media_type": "image/png",
+                        "data": reference
+                    }
+                },
+                {
+                    "type": "image",  # Added missing type
+                    "source": {
+                        "type": "base64",
+                        "media_type": "image/jpeg",
+                        "data": encoded
+                    }
+                }
+            ]
+
+
        if model_source == "OpenAI":
            from openai import OpenAI
            client = OpenAI(api_key=api_key)
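Once prompt is built in the OpenAI shape, it is passed as the content of a single user message; the removed Perplexity branch in the next hunk shows exactly this call pattern. A minimal sketch of that request, with placeholder model and key values that are not taken from the package:

    from openai import OpenAI

    client = OpenAI(api_key="sk-...")  # placeholder key

    # `prompt` is the list of text + image_url content parts built above.
    response_obj = client.chat.completions.create(
        model="gpt-4o",  # illustrative model name
        messages=[{"role": "user", "content": prompt}],
        temperature=0,
    )
    reply = response_obj.choices[0].message.content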
@@ -357,20 +405,6 @@ def extract_image_score(
                print(f"An error occurred: {e}")
                link1.append(f"Error processing input: {e}")
 
-        elif model_source == "Perplexity":
-            from openai import OpenAI
-            client = OpenAI(api_key=api_key, base_url="https://api.perplexity.ai")
-            try:
-                response_obj = client.chat.completions.create(
-                    model=user_model,
-                    messages=[{'role': 'user', 'content': prompt}],
-                    temperature=creativity
-                )
-                reply = response_obj.choices[0].message.content
-                link1.append(reply)
-            except Exception as e:
-                print(f"An error occurred: {e}")
-                link1.append(f"Error processing input: {e}")
        elif model_source == "Anthropic":
            import anthropic
            client = anthropic.Anthropic(api_key=api_key)
@@ -386,6 +420,7 @@ def extract_image_score(
            except Exception as e:
                print(f"An error occurred: {e}")
                link1.append(f"Error processing input: {e}")
+
        elif model_source == "Mistral":
            from mistralai import Mistral
            client = Mistral(api_key=api_key)
@@ -468,7 +503,7 @@ def extract_image_score(
    return categorized_data
 
 # image features function
-def extract_image_features(
+def image_features(
    image_description,
    image_input,
    features_to_extract,
@@ -530,41 +565,80 @@ def extract_image_features(
 
    for i, img_path in enumerate(
            tqdm(image_files, desc="Categorising images"), start=0):
+        if img_path is None or not os.path.exists(img_path):
+            link1.append("Skipped NaN input or invalid path")
+            extracted_jsons.append("""{"no_valid_image": 1}""")
+            continue  # Skip the rest of the loop iteration
        # encode this specific image once
        with open(img_path, "rb") as f:
            encoded = base64.b64encode(f.read()).decode("utf-8")
        ext = Path(img_path).suffix.lstrip(".").lower()
        encoded_image = f"data:image/{ext};base64,{encoded}"
 
-       [29 removed lines (old 539-567) are not rendered in this diff view]
+        if model_source == "OpenAI":
+            prompt = [
+                {
+                    "type": "text",
+                    "text": (
+                        f"You are a visual question answering assistant.\n"
+                        f"Task ► Analyze the attached image and answer these specific questions:\n\n"
+                        f"Image context: {image_description}\n\n"
+                        f"Questions to answer:\n{categories_str}\n\n"
+                        f"Output format ► Return **only** a JSON object where:\n"
+                        f"- Keys are question numbers ('1', '2', ...)\n"
+                        f"- Values are concise answers (numbers, short phrases)\n\n"
+                        f"Example for 3 questions:\n"
+                        "{\n"
+                        ' "1": "4",\n'
+                        ' "2": "blue",\n'
+                        ' "3": "yes"\n'
+                        "}\n\n"
+                        f"Important rules:\n"
+                        f"1. Answer directly - no explanations\n"
+                        f"2. Use exact numerical values when possible\n"
+                        f"3. For yes/no questions, use 'yes' or 'no'\n"
+                        f"4. Never add extra keys or formatting"
+                    ),
+                },
+                {
+                    "type": "image_url",
+                    "image_url": {"url": encoded_image, "detail": "high"},
+                },
+            ]
+        elif model_source == "Anthropic":
+            prompt = [
+                {
+                    "type": "text",
+                    "text": (
+                        f"You are a visual question answering assistant.\n"
+                        f"Task ► Analyze the attached image and answer these specific questions:\n\n"
+                        f"Image context: {image_description}\n\n"
+                        f"Questions to answer:\n{categories_str}\n\n"
+                        f"Output format ► Return **only** a JSON object where:\n"
+                        f"- Keys are question numbers ('1', '2', ...)\n"
+                        f"- Values are concise answers (numbers, short phrases)\n\n"
+                        f"Example for 3 questions:\n"
+                        "{\n"
+                        ' "1": "4",\n'
+                        ' "2": "blue",\n'
+                        ' "3": "yes"\n'
+                        "}\n\n"
+                        f"Important rules:\n"
+                        f"1. Answer directly - no explanations\n"
+                        f"2. Use exact numerical values when possible\n"
+                        f"3. For yes/no questions, use 'yes' or 'no'\n"
+                        f"4. Never add extra keys or formatting"
+                    )
+                },
+                {
+                    "type": "image",
+                    "source": {
+                        "type": "base64",
+                        "media_type": "image/jpeg",
+                        "data": encoded
+                    }
+                }
+            ]
        if model_source == "OpenAI":
            from openai import OpenAI
            client = OpenAI(api_key=api_key)
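The first added block in this hunk is a guard that keeps one bad row from aborting the whole run: missing or non-existent paths are logged and given a stub JSON result before the loop moves on to the next image. A small self-contained sketch of that pattern, using made-up file names:

    import os
    import base64
    from pathlib import Path
    from tqdm import tqdm

    image_files = ["drawings/cat.png", None, "drawings/missing.png"]  # made-up inputs
    link1, extracted_jsons = [], []

    for img_path in tqdm(image_files, desc="Categorising images"):
        # Skip None/NaN entries and paths that do not exist on disk.
        if img_path is None or not os.path.exists(img_path):
            link1.append("Skipped NaN input or invalid path")
            extracted_jsons.append('{"no_valid_image": 1}')
            continue

        # Encode this specific image once and wrap it as a data URL.
        with open(img_path, "rb") as f:
            encoded = base64.b64encode(f.read()).decode("utf-8")
        ext = Path(img_path).suffix.lstrip(".").lower()
        encoded_image = f"data:image/{ext};base64,{encoded}"
        print(img_path, len(encoded_image))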
cat_llm-0.0.27.dist-info/RECORD
DELETED
@@ -1,9 +0,0 @@
-catllm/CERAD_functions.py,sha256=mtHxshRWmWXMH9kkkCfbMHXgDe00EVabjFiN8s73LPI,16935
-catllm/__about__.py,sha256=H3dYrI6XpHXpRmgCCiw8u2dIaFZWRsw7RxfRy_aIlaQ,404
-catllm/__init__.py,sha256=kLk180aJna1s-wU6CLr4_hKkbjoeET-11jGmC1pdhQw,330
-catllm/cat_llm.py,sha256=Rwyz93caNf0h9tfurObY6qDjtG6EKaYXR0GrVW7h2kU,16920
-catllm/image_functions.py,sha256=rMa7Jb565Rp75pbRKYF8Sqk_Uwuv60olMU0Mbvbq55s,27440
-cat_llm-0.0.27.dist-info/METADATA,sha256=ocT3Y5NoA9csBGpSkg0G_PCPPhbm_EgWiNicpf9Xf-I,1679
-cat_llm-0.0.27.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-cat_llm-0.0.27.dist-info/licenses/LICENSE,sha256=wJLsvOr6lrFUDcoPXExa01HOKFWrS3JC9f0RudRw8uw,1075
-cat_llm-0.0.27.dist-info/RECORD,,
{cat_llm-0.0.27.dist-info → cat_llm-0.0.29.dist-info}/WHEEL
File without changes

{cat_llm-0.0.27.dist-info → cat_llm-0.0.29.dist-info}/licenses/LICENSE
File without changes