vision-agent 0.0.13__tar.gz → 0.0.15__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {vision_agent-0.0.13 → vision_agent-0.0.15}/PKG-INFO +6 -4
- {vision_agent-0.0.13 → vision_agent-0.0.15}/README.md +4 -2
- {vision_agent-0.0.13 → vision_agent-0.0.15}/pyproject.toml +2 -2
- {vision_agent-0.0.13 → vision_agent-0.0.15}/LICENSE +0 -0
- {vision_agent-0.0.13 → vision_agent-0.0.15}/vision_agent/__init__.py +0 -0
- {vision_agent-0.0.13 → vision_agent-0.0.15}/vision_agent/data/__init__.py +0 -0
- {vision_agent-0.0.13 → vision_agent-0.0.15}/vision_agent/data/data.py +0 -0
- {vision_agent-0.0.13 → vision_agent-0.0.15}/vision_agent/emb/__init__.py +0 -0
- {vision_agent-0.0.13 → vision_agent-0.0.15}/vision_agent/emb/emb.py +0 -0
- {vision_agent-0.0.13 → vision_agent-0.0.15}/vision_agent/lmm/__init__.py +0 -0
- {vision_agent-0.0.13 → vision_agent-0.0.15}/vision_agent/lmm/lmm.py +0 -0
@@ -1,10 +1,10 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: vision-agent
|
3
|
-
Version: 0.0.13
|
3
|
+
Version: 0.0.15
|
4
4
|
Summary: Toolset for Vision Agent
|
5
5
|
Author: Landing AI
|
6
6
|
Author-email: dev@landing.ai
|
7
|
-
Requires-Python: >=3.10,<
|
7
|
+
Requires-Python: >=3.10,<3.12
|
8
8
|
Classifier: Programming Language :: Python :: 3
|
9
9
|
Classifier: Programming Language :: Python :: 3.10
|
10
10
|
Classifier: Programming Language :: Python :: 3.11
|
@@ -27,11 +27,13 @@ Description-Content-Type: text/markdown
|
|
27
27
|
|
28
28
|
[](https://discord.gg/wPdN8RCYew)
|
29
29
|
|
30
|
-
Vision Agent is a
|
30
|
+
Vision Agent is a library that helps you use multimodal models to organize and structure your image data. Check out our Discord for roadmaps and updates!
|
31
|
+
|
32
|
+
One of the problems of dealing with image data is that it can be difficult to organize and search. For example, you might have a bunch of pictures of houses and want to count how many yellow houses you have, or how many houses with adobe roofs. The Vision Agent library uses LMMs to help create tags or descriptions of images to allow you to search over them, or use them in a database to carry out other operations.
|
31
33
|
|
32
34
|
## Getting Started
|
33
35
|
### LMMs
|
34
|
-
To get started you can
|
36
|
+
To get started, you can use an LMM to start generating text from images. The following code will use the LLaVA-1.6 34B model to generate a description of the image you pass it.
|
35
37
|
|
36
38
|
```python
|
37
39
|
import vision_agent as va
|
@@ -2,11 +2,13 @@
|
|
2
2
|
|
3
3
|
[](https://discord.gg/wPdN8RCYew)
|
4
4
|
|
5
|
-
Vision Agent is a
|
5
|
+
Vision Agent is a library that helps you use multimodal models to organize and structure your image data. Check out our Discord for roadmaps and updates!
|
6
|
+
|
7
|
+
One of the problems of dealing with image data is that it can be difficult to organize and search. For example, you might have a bunch of pictures of houses and want to count how many yellow houses you have, or how many houses with adobe roofs. The Vision Agent library uses LMMs to help create tags or descriptions of images to allow you to search over them, or use them in a database to carry out other operations.
|
6
8
|
|
7
9
|
## Getting Started
|
8
10
|
### LMMs
|
9
|
-
To get started you can
|
11
|
+
To get started, you can use an LMM to start generating text from images. The following code will use the LLaVA-1.6 34B model to generate a description of the image you pass it.
|
10
12
|
|
11
13
|
```python
|
12
14
|
import vision_agent as va
|
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
|
|
4
4
|
|
5
5
|
[tool.poetry]
|
6
6
|
name = "vision-agent"
|
7
|
-
version = "0.0.13"
|
7
|
+
version = "0.0.15"
|
8
8
|
description = "Toolset for Vision Agent"
|
9
9
|
authors = ["Landing AI <dev@landing.ai>"]
|
10
10
|
readme = "README.md"
|
@@ -16,7 +16,7 @@ packages = [{include = "vision_agent"}]
|
|
16
16
|
"documentation" = "https://github.com/landing-ai/vision-agent"
|
17
17
|
|
18
18
|
[tool.poetry.dependencies] # main dependency group
|
19
|
-
python = ">=3.10,<
|
19
|
+
python = ">=3.10,<3.12"
|
20
20
|
|
21
21
|
numpy = ">=1.21.0,<2.0.0"
|
22
22
|
pillow = "10.*"
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|