academia-mcp 1.10.6__py3-none-any.whl → 1.10.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
academia_mcp/server.py CHANGED
@@ -42,6 +42,7 @@ from academia_mcp.tools.bitflip import (
42
42
  from academia_mcp.tools.review import review_pdf_paper, download_pdf_paper
43
43
  from academia_mcp.tools.show_image import show_image, describe_image
44
44
  from academia_mcp.tools.speech_to_text import speech_to_text
45
+ from academia_mcp.tools.yt_transcript import yt_transcript
45
46
 
46
47
 
47
48
  def configure_uvicorn_style_logging(level: int = logging.INFO) -> None:
@@ -92,6 +93,7 @@ def run(
92
93
  server.add_tool(get_latex_templates_list)
93
94
  server.add_tool(visit_webpage)
94
95
  server.add_tool(show_image)
96
+ server.add_tool(yt_transcript)
95
97
 
96
98
  if settings.WORKSPACE_DIR:
97
99
  server.add_tool(compile_latex)
academia_mcp/settings.py CHANGED
@@ -21,6 +21,9 @@ class Settings(BaseSettings):
21
21
  DOCUMENT_QA_DOCUMENT_MAX_LENGTH: int = 200000
22
22
  DESCRIBE_IMAGE_MODEL_NAME: str = "gpt-4.1"
23
23
 
24
+ WEBSHARE_PROXY_USERNAME: Optional[str] = None
25
+ WEBSHARE_PROXY_PASSWORD: Optional[str] = None
26
+
24
27
  PORT: int = 5056
25
28
  WORKSPACE_DIR: Optional[Path] = None
26
29
 
@@ -16,6 +16,7 @@ from .bitflip import extract_bitflip_info, generate_research_proposals, score_re
16
16
  from .review import review_pdf_paper, download_pdf_paper, review_pdf_paper_by_url
17
17
  from .show_image import show_image, describe_image
18
18
  from .speech_to_text import speech_to_text
19
+ from .yt_transcript import yt_transcript
19
20
 
20
21
  __all__ = [
21
22
  "arxiv_search",
@@ -45,4 +46,5 @@ __all__ = [
45
46
  "show_image",
46
47
  "describe_image",
47
48
  "speech_to_text",
49
+ "yt_transcript",
48
50
  ]
@@ -1,5 +1,5 @@
1
1
  import json
2
- from typing import Optional, List
2
+ from typing import Optional, List, Tuple
3
3
 
4
4
  from academia_mcp.utils import post_with_retries, get_with_retries
5
5
  from academia_mcp.settings import settings
@@ -12,6 +12,24 @@ BRAVE_SEARCH_URL = "https://api.search.brave.com/res/v1/web/search"
12
12
  EXCLUDE_DOMAINS = ["chatpaper.com"]
13
13
 
14
14
 
15
+ def _parse_domains(query: str) -> Tuple[str, List[str]]:
16
+ site_term = "site:"
17
+ if site_term not in query:
18
+ return query, []
19
+ parts = query.split()
20
+ query_parts = []
21
+ include_domains = []
22
+ for part in parts:
23
+ if not part.startswith(site_term):
24
+ query_parts.append(part)
25
+ continue
26
+ domain = part[len(site_term) :]
27
+ if domain:
28
+ include_domains.append(domain)
29
+ query = " ".join(query_parts)
30
+ return query, include_domains
31
+
32
+
15
33
  def web_search(
16
34
  query: str,
17
35
  limit: Optional[int] = 20,
@@ -40,6 +58,13 @@ def web_search(
40
58
  isinstance(domain, str) for domain in include_domains
41
59
  ), "Error: include_domains should be a list of strings"
42
60
 
61
+ query, query_include_domains = _parse_domains(query)
62
+ if query_include_domains:
63
+ if include_domains:
64
+ include_domains.extend(query_include_domains)
65
+ else:
66
+ include_domains = query_include_domains
67
+
43
68
  is_tavily_available = bool(settings.TAVILY_API_KEY)
44
69
  is_exa_available = bool(settings.EXA_API_KEY)
45
70
  is_brave_available = bool(settings.BRAVE_API_KEY)
@@ -0,0 +1,30 @@
1
+ from youtube_transcript_api import YouTubeTranscriptApi
2
+ from youtube_transcript_api.proxies import WebshareProxyConfig
3
+
4
+ from academia_mcp.settings import settings
5
+
6
+
7
+ def yt_transcript(video_url: str) -> str:
8
+ """
9
+ Tool to fetch the transcript of a YouTube video given its URL.
10
+
11
+ Returns a transcript of the video as a single string.
12
+
13
+ Args:
14
+ video_url (str): YouTube video URL.
15
+ """
16
+ if "youtu.be" in video_url:
17
+ video_id = video_url.strip().split("youtu.be/")[1]
18
+ else:
19
+ video_id = video_url.strip().split("v=")[-1]
20
+ video_id = video_id.split("?")[0]
21
+ proxy_config = None
22
+ if settings.WEBSHARE_PROXY_USERNAME and settings.WEBSHARE_PROXY_PASSWORD:
23
+ proxy_config = WebshareProxyConfig(
24
+ proxy_username=settings.WEBSHARE_PROXY_USERNAME,
25
+ proxy_password=settings.WEBSHARE_PROXY_PASSWORD,
26
+ )
27
+ api = YouTubeTranscriptApi(proxy_config=proxy_config)
28
+ transcript = api.fetch(video_id)
29
+ snippets = transcript.snippets
30
+ return "\n".join([f"{int(entry.start)}: {' '.join(entry.text.split())}" for entry in snippets])
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: academia-mcp
3
- Version: 1.10.6
3
+ Version: 1.10.8
4
4
  Summary: MCP server that provides different tools to search for scientific publications
5
5
  Author-email: Ilya Gusev <phoenixilya@gmail.com>
6
6
  Project-URL: Homepage, https://github.com/IlyaGusev/academia_mcp
@@ -30,6 +30,7 @@ Requires-Dist: datasets>=4.0.0
30
30
  Requires-Dist: pymupdf>=1.26.4
31
31
  Requires-Dist: pillow>=11.3.0
32
32
  Requires-Dist: pydantic-settings>=2.6.0
33
+ Requires-Dist: youtube-transcript-api>=1.2.2
33
34
  Dynamic: license-file
34
35
 
35
36
  # Academia MCP
@@ -4,12 +4,12 @@ academia_mcp/files.py,sha256=ynIt0XbU1Z7EPWkv_hVX0pGKsLlmjYv-MVJLOfi6yzs,817
4
4
  academia_mcp/llm.py,sha256=zpGkuJFf58Ofgys_fi28-47_wJ1a7sIs_yZvI1Si6z0,993
5
5
  academia_mcp/pdf.py,sha256=9PlXzHGhb6ay3ldbTdxCcTWvH4TkET3bnb64mgoh9i0,1273
6
6
  academia_mcp/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
7
- academia_mcp/server.py,sha256=hNfQSFwgbVMNyB7ElGpJ0RCTGeRP7jb5--7KZmG8cW8,5423
8
- academia_mcp/settings.py,sha256=MSQYjmhZ3NDalTzu4z3ey1Aw60TrhkDcPWUTE4-iOaU,995
7
+ academia_mcp/server.py,sha256=tZ57YkW2EcW4DRIk87n2PFZkkTjAVsVQ5lphvc1AVA4,5517
8
+ academia_mcp/settings.py,sha256=c5s4dI8V_cWmMED-jKDmHjfdIaBcxwEK4HdHNQ3WUIg,1096
9
9
  academia_mcp/utils.py,sha256=lRlb615JJ_0d4gcFpMoBjB6w0xXcde9dFDw0LwYpSPQ,4863
10
10
  academia_mcp/latex_templates/agents4science_2025/agents4science_2025.sty,sha256=hGcEPCYBJS4vdhWvN_yEaJC4GvT_yDroI94CfY2Oguk,12268
11
11
  academia_mcp/latex_templates/agents4science_2025/agents4science_2025.tex,sha256=Tl1QkHXHRopw9VEfWrD3Layr5JP_0gIzVQjL4KXIWqc,15814
12
- academia_mcp/tools/__init__.py,sha256=lGUy5C4IymplHOXqOiwDD7CT4Z8aPHJqSxXo2g9qkks,1493
12
+ academia_mcp/tools/__init__.py,sha256=Z30vULZwUeUX5nDz5wcv0znhAeBtZRa0dvz7vD8SUYE,1555
13
13
  academia_mcp/tools/anthology_search.py,sha256=rhFpJZqGLABgr0raDuH0CARBiAJNJtEI4dlMrKNHfDQ,7669
14
14
  academia_mcp/tools/arxiv_download.py,sha256=gBY0_Kz0yGtVkLMwn6GrAyfBjovZVgcSMuyy67p65Cw,10474
15
15
  academia_mcp/tools/arxiv_search.py,sha256=pzM18qrF3QL03A53w003kE7hQi3s3QKtjgw0m7K88UY,8355
@@ -23,10 +23,11 @@ academia_mcp/tools/s2.py,sha256=QX7-pbetab3Xt_1tvVPU6o5D_NAe9y6jcTGRBK1vwtY,6200
23
23
  academia_mcp/tools/show_image.py,sha256=jiJlQ53dbZ0T61OBhCT3IKVvBl9NHc6jHgWLfg5BxiE,3856
24
24
  academia_mcp/tools/speech_to_text.py,sha256=YZzMqdvunzXkpcadP_mYhm6cs4qH1Y_42SfY-7eX4O4,1601
25
25
  academia_mcp/tools/visit_webpage.py,sha256=swlFwWRzWc7-AHP2ouRZJScSTA4dHZ32fuJnA2V0lUc,3311
26
- academia_mcp/tools/web_search.py,sha256=2haTqnWkoISWS7VZSI0h7mW-jjWFItA8SL1FkkUxzI8,7864
27
- academia_mcp-1.10.6.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
28
- academia_mcp-1.10.6.dist-info/METADATA,sha256=pwPpp2xupjkVubi5Yt6JQqknFserzyRn-0xc2MGsIYI,6311
29
- academia_mcp-1.10.6.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
30
- academia_mcp-1.10.6.dist-info/entry_points.txt,sha256=gxkiKJ74w2FwJpSECpjA3XtCfI5ZfrM6N8cqnwsq4yY,51
31
- academia_mcp-1.10.6.dist-info/top_level.txt,sha256=CzGpRFsRRJRqWEb1e3SUlcfGqRzOxevZGaJWrtGF8W0,13
32
- academia_mcp-1.10.6.dist-info/RECORD,,
26
+ academia_mcp/tools/web_search.py,sha256=VphVztf2jZNT3bPJPJuTdMkKbe2-LIbSV7keKV47lac,8616
27
+ academia_mcp/tools/yt_transcript.py,sha256=NPBVGN-LG_N6yElQYBMEnbNhSjkM3-DPeVIJwlFGqA0,1104
28
+ academia_mcp-1.10.8.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
29
+ academia_mcp-1.10.8.dist-info/METADATA,sha256=Cw-6atEo6S0MAjBKkgsHZxw-GJCcTZWAiOSQGeftarM,6356
30
+ academia_mcp-1.10.8.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
31
+ academia_mcp-1.10.8.dist-info/entry_points.txt,sha256=gxkiKJ74w2FwJpSECpjA3XtCfI5ZfrM6N8cqnwsq4yY,51
32
+ academia_mcp-1.10.8.dist-info/top_level.txt,sha256=CzGpRFsRRJRqWEb1e3SUlcfGqRzOxevZGaJWrtGF8W0,13
33
+ academia_mcp-1.10.8.dist-info/RECORD,,