vision-agent 0.0.10__py3-none-any.whl → 0.0.11__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
vision_agent/data/data.py CHANGED
@@ -2,7 +2,7 @@ from __future__ import annotations
2
2
 
3
3
  import uuid
4
4
  from pathlib import Path
5
- from typing import Dict, List, Optional, Union, cast
5
+ from typing import Dict, List, Optional, Union, cast, Callable
6
6
 
7
7
  import faiss
8
8
  import numpy as np
@@ -44,18 +44,25 @@ class DataStore:
44
44
  self.lmm = lmm
45
45
  return self
46
46
 
47
- def add_column(self, name: str, prompt: str) -> Self:
47
+ def add_column(
48
+ self, name: str, prompt: str, func: Optional[Callable[[str], str]] = None
49
+ ) -> Self:
48
50
  r"""Adds a new column to the DataFrame containing the generated metadata from the LMM.
49
51
 
50
52
  Args:
51
53
  name (str): The name of the column to be added.
52
54
  prompt (str): The prompt to be used to generate the metadata.
55
+ func (Optional[Callable[[str], str]]): A Python function applied to the string returned by `lmm.generate` before it is stored in the column. Defaults to None, in which case the raw output is stored.
53
56
  """
54
57
  if self.lmm is None:
55
58
  raise ValueError("LMM not set yet")
56
59
 
57
60
  self.df[name] = self.df["image_paths"].progress_apply( # type: ignore
58
- lambda x: self.lmm.generate(prompt, image=x)
61
+ lambda x: (
62
+ func(self.lmm.generate(prompt, image=x))
63
+ if func
64
+ else self.lmm.generate(prompt, image=x)
65
+ )
59
66
  )
60
67
  return self
61
68
 
vision_agent/lmm/lmm.py CHANGED
@@ -31,10 +31,18 @@ class LLaVALMM(LMM):
31
31
  def __init__(self, name: str):
32
32
  self.name = name
33
33
 
34
- def generate(self, prompt: str, image: Optional[Union[str, Path]] = None) -> str:
34
+ def generate(
35
+ self,
36
+ prompt: str,
37
+ image: Optional[Union[str, Path]] = None,
38
+ temperature: float = 0.1,
39
+ max_new_tokens: int = 1500,
40
+ ) -> str:
35
41
  data = {"prompt": prompt}
36
42
  if image:
37
43
  data["image"] = encode_image(image)
44
+ data["temperature"] = temperature # type: ignore
45
+ data["max_new_tokens"] = max_new_tokens # type: ignore
38
46
  res = requests.post(
39
47
  _LLAVA_ENDPOINT,
40
48
  headers={"Content-Type": "application/json"},
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: vision-agent
3
- Version: 0.0.10
3
+ Version: 0.0.11
4
4
  Summary: Toolset for Vision Agent
5
5
  Author: Landing AI
6
6
  Author-email: dev@landing.ai
@@ -1,11 +1,11 @@
1
1
  vision_agent/__init__.py,sha256=CpcsVD1aYoCoOD-LNlHAehJPSZBYTtK6CFjiqXUTMAY,172
2
2
  vision_agent/data/__init__.py,sha256=YU-5g3LbEQ6a4drz0RLGTagXMVU2Z4Xr3RlfWE-R0jU,46
3
- vision_agent/data/data.py,sha256=iSLmxPzswQ0g1TOUgBDWBbpF6X8PSAk15oGQxQjhX-o,4833
3
+ vision_agent/data/data.py,sha256=7hM_YprDDgLqreg_qsc-udEUe8cfJQ3-xg6BlVNBG0k,5154
4
4
  vision_agent/emb/__init__.py,sha256=YmCkGrJBtXb6X6Z3lnKiFoQYKXMgHMJp8JJyMLVvqcI,75
5
5
  vision_agent/emb/emb.py,sha256=la9lhEzk7jqUCjYYQ5oRgVNSnC9_EJBJIpE_B9c6PJo,1375
6
6
  vision_agent/lmm/__init__.py,sha256=I8mbeNUajTfWVNqLsuFQVOaNBDlkIhYp9DFU8H4kB7g,51
7
- vision_agent/lmm/lmm.py,sha256=jPk6rRKUNfKN8P-ShCDosfCtfGkj3aU74x1U8vrZ7yg,2695
8
- vision_agent-0.0.10.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
9
- vision_agent-0.0.10.dist-info/METADATA,sha256=-6Oyb1M-BjjGhonR0vCvXkEwjIJdDI-phYKfjcQ3lA0,3795
10
- vision_agent-0.0.10.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
11
- vision_agent-0.0.10.dist-info/RECORD,,
7
+ vision_agent/lmm/lmm.py,sha256=pNUs5XUKUubksFEK_58euE9HPKoPV30mRKtDBEb93MQ,2918
8
+ vision_agent-0.0.11.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
9
+ vision_agent-0.0.11.dist-info/METADATA,sha256=CDuOoFqKfzB0F5a_mWRaLi9kvskMouD2gDygdVyxbsk,3795
10
+ vision_agent-0.0.11.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
11
+ vision_agent-0.0.11.dist-info/RECORD,,