hyperbrowser 0.16.0__py3-none-any.whl → 0.18.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of hyperbrowser might be problematic. More details are available from the release notice linked on the original page (the link target is not preserved in this text).

@@ -0,0 +1,62 @@
1
+ from hyperbrowser.models.crawl import StartCrawlJobParams
2
+ from hyperbrowser.models.scrape import StartScrapeJobParams
3
+ from hyperbrowser import Hyperbrowser, AsyncHyperbrowser
4
+
5
+ from .openai import (
6
+ SCRAPE_TOOL_OPENAI,
7
+ CRAWL_TOOL_OPENAI,
8
+ )
9
+ from .anthropic import (
10
+ SCRAPE_TOOL_ANTHROPIC,
11
+ CRAWL_TOOL_ANTHROPIC,
12
+ )
13
+
14
+
15
+ class WebsiteScrapeTool:
16
+ openai_tool_definition = SCRAPE_TOOL_OPENAI
17
+ anthropic_tool_definition = SCRAPE_TOOL_ANTHROPIC
18
+
19
+ @staticmethod
20
+ def runnable(hb: Hyperbrowser, params: dict) -> str:
21
+ resp = hb.scrape.start_and_wait(params=StartScrapeJobParams(**params))
22
+ return resp.data.markdown if resp.data and resp.data.markdown else ""
23
+
24
+ @staticmethod
25
+ async def async_runnable(hb: AsyncHyperbrowser, params: dict) -> str:
26
+ resp = await hb.scrape.start_and_wait(params=StartScrapeJobParams(**params))
27
+ return resp.data.markdown if resp.data and resp.data.markdown else ""
28
+
29
+
30
+ class WebsiteCrawlTool:
31
+ openai_tool_definition = CRAWL_TOOL_OPENAI
32
+ anthropic_tool_definition = CRAWL_TOOL_ANTHROPIC
33
+
34
+ @staticmethod
35
+ def runnable(hb: Hyperbrowser, params: dict) -> str:
36
+ resp = hb.crawl.start_and_wait(params=StartCrawlJobParams(**params))
37
+ markdown = ""
38
+ if resp.data:
39
+ for page in resp.data:
40
+ if page.markdown:
41
+ markdown += (
42
+ f"\n{'-'*50}\nUrl: {page.url}\nMarkdown:\n{page.markdown}\n"
43
+ )
44
+ return markdown
45
+
46
+ @staticmethod
47
+ async def async_runnable(hb: AsyncHyperbrowser, params: dict) -> str:
48
+ resp = await hb.crawl.start_and_wait(params=StartCrawlJobParams(**params))
49
+ markdown = ""
50
+ if resp.data:
51
+ for page in resp.data:
52
+ if page.markdown:
53
+ markdown += (
54
+ f"\n{'-'*50}\nUrl: {page.url}\nMarkdown:\n{page.markdown}\n"
55
+ )
56
+ return markdown
57
+
58
+
59
+ __all__ = [
60
+ "WebsiteScrapeTool",
61
+ "WebsiteCrawlTool",
62
+ ]
@@ -54,6 +54,7 @@ SCRAPE_TOOL_OPENAI: ChatCompletionToolParam = {
54
54
  "name": "scrape_webpage",
55
55
  "description": "Scrape content from a webpage and return the content in markdown format",
56
56
  "parameters": SCRAPE_SCHEMA,
57
+ "strict": True,
57
58
  },
58
59
  }
59
60
 
@@ -63,5 +64,6 @@ CRAWL_TOOL_OPENAI: ChatCompletionToolParam = {
63
64
  "name": "crawl_website",
64
65
  "description": "Crawl a website and return the content in markdown format",
65
66
  "parameters": CRAWL_SCHEMA,
67
+ "strict": True,
66
68
  },
67
69
  }
@@ -21,6 +21,8 @@ SCRAPE_OPTIONS = {
21
21
  "description": "Whether to only return the main content of the page. If true, only the main content of the page will be returned, excluding any headers, navigation menus,footers, or other non-main content.",
22
22
  },
23
23
  },
24
+ "required": ["include_tags", "exclude_tags", "only_main_content"],
25
+ "additionalProperties": False,
24
26
  }
25
27
 
26
28
  SCRAPE_SCHEMA = {
@@ -32,7 +34,8 @@ SCRAPE_SCHEMA = {
32
34
  },
33
35
  "scrape_options": SCRAPE_OPTIONS,
34
36
  },
35
- "required": ["url"],
37
+ "required": ["url", "scrape_options"],
38
+ "additionalProperties": False,
36
39
  }
37
40
 
38
41
  CRAWL_SCHEMA = {
@@ -44,7 +47,6 @@ CRAWL_SCHEMA = {
44
47
  },
45
48
  "max_pages": {
46
49
  "type": "number",
47
- "default": 10,
48
50
  "description": "The maximum number of pages to crawl",
49
51
  },
50
52
  "follow_links": {
@@ -71,5 +73,14 @@ CRAWL_SCHEMA = {
71
73
  },
72
74
  "scrape_options": SCRAPE_OPTIONS,
73
75
  },
74
- "required": ["url"],
76
+ "required": [
77
+ "url",
78
+ "max_pages",
79
+ "follow_links",
80
+ "ignore_sitemap",
81
+ "exclude_patterns",
82
+ "include_patterns",
83
+ "scrape_options",
84
+ ],
85
+ "additionalProperties": False,
75
86
  }
@@ -1,21 +1,22 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: hyperbrowser
3
- Version: 0.16.0
3
+ Version: 0.18.0
4
4
  Summary: Python SDK for hyperbrowser
5
- Home-page: https://github.com/hyperbrowserai/python-sdk
6
5
  License: MIT
7
6
  Author: Nikhil Shahi
8
7
  Author-email: nshahi1998@gmail.com
9
- Requires-Python: >=3.9,<4.0
8
+ Requires-Python: >=3.8,<4.0
10
9
  Classifier: License :: OSI Approved :: MIT License
11
10
  Classifier: Programming Language :: Python :: 3
11
+ Classifier: Programming Language :: Python :: 3.8
12
12
  Classifier: Programming Language :: Python :: 3.9
13
13
  Classifier: Programming Language :: Python :: 3.10
14
14
  Classifier: Programming Language :: Python :: 3.11
15
15
  Classifier: Programming Language :: Python :: 3.12
16
16
  Classifier: Programming Language :: Python :: 3.13
17
- Requires-Dist: httpx (>=0.28.0,<0.29.0)
18
- Requires-Dist: pydantic (>=2.10.0,<3.0.0)
17
+ Requires-Dist: httpx (>=0.23.0,<1)
18
+ Requires-Dist: pydantic (>=1.9.0,<3)
19
+ Project-URL: Homepage, https://github.com/hyperbrowserai/python-sdk
19
20
  Project-URL: Repository, https://github.com/hyperbrowserai/python-sdk
20
21
  Description-Content-Type: text/markdown
21
22
 
@@ -20,13 +20,14 @@ hyperbrowser/models/extension.py,sha256=nXjKXKt9R7RxyZ4hd3EvfqZsEGy_ufh1r5j2mqCL
20
20
  hyperbrowser/models/profile.py,sha256=SYu4SR6OSwvg0C3bMW3j9z3zhPi-IzXuJE5aVJ3t-Nc,397
21
21
  hyperbrowser/models/scrape.py,sha256=yjoU-w1wvTROp5PYu9vyJUEaeuqYjErtnFkzWxxqgk4,2140
22
22
  hyperbrowser/models/session.py,sha256=nGcepy8j_xfYC3-hj12467pc913Zx952WYa6Cym0kiI,5056
23
+ hyperbrowser/tools/__init__.py,sha256=OUaTUM-kiigYmzfbpx3XQhzMK1xT1wd8cqXgR4znsAY,2021
23
24
  hyperbrowser/tools/anthropic.py,sha256=5pEkJm1H-26GToTwXsDjo4GGqVy1hATws4Pg59mumow,1667
24
- hyperbrowser/tools/openai.py,sha256=eVzWccdwCBJdCTej5t_H48Pqk0oNR2gdToYO5BpE0Mc,2152
25
- hyperbrowser/tools/schema.py,sha256=ONgJG0tNT1NVI1-RdLWqF6DHTQ0xRGp1w6OF8UBrKcE,2740
25
+ hyperbrowser/tools/openai.py,sha256=4-71IIWSxc_ByhywcfWj9-QI9iYNEe0xO6B2spE8WG0,2200
26
+ hyperbrowser/tools/schema.py,sha256=cR2MUX8TvUyN8TnCyeX0pccp4AmPjrdaKzuAXRThOJo,3075
26
27
  hyperbrowser/transport/async_transport.py,sha256=MIPJvilvZWBPXLZ96c9OohuN6TN9DaaU0EnyleG3q6g,4017
27
28
  hyperbrowser/transport/base.py,sha256=ildpMrDiM8nvrSGrH2LTOafmB17T7PQB_NQ1ODA378U,1703
28
29
  hyperbrowser/transport/sync.py,sha256=ER844H_OCPCrnmbc58cuqphWTVvCZJQn7-D7ZenCr3Y,3311
29
- hyperbrowser-0.16.0.dist-info/LICENSE,sha256=6rUGKlyKb_1ZAH7h7YITYAAUNFN3MNGGKCyfrw49NLE,1071
30
- hyperbrowser-0.16.0.dist-info/METADATA,sha256=QLfXYK0clu7vbXCO4X0qmy1QS5gbux1L0T81Y69KFNs,3388
31
- hyperbrowser-0.16.0.dist-info/WHEEL,sha256=RaoafKOydTQ7I_I3JTrPCg6kUmTgtm4BornzOqyEfJ8,88
32
- hyperbrowser-0.16.0.dist-info/RECORD,,
30
+ hyperbrowser-0.18.0.dist-info/LICENSE,sha256=6rUGKlyKb_1ZAH7h7YITYAAUNFN3MNGGKCyfrw49NLE,1071
31
+ hyperbrowser-0.18.0.dist-info/METADATA,sha256=GxrLTW97b-ht751LBX0D9bkwETVWA2jBn0hkcD8WIEQ,3440
32
+ hyperbrowser-0.18.0.dist-info/WHEEL,sha256=IYZQI976HJqqOpQU6PHkJ8fb3tMNBFjg-Cn-pwAbaFM,88
33
+ hyperbrowser-0.18.0.dist-info/RECORD,,
@@ -1,4 +1,4 @@
1
1
  Wheel-Version: 1.0
2
- Generator: poetry-core 2.0.0
2
+ Generator: poetry-core 2.0.1
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any