PyPI - recent-state-summarizer - Versions diffs - 0.0.2__tar.gz → 0.0.3__tar.gz - Mend

recent-state-summarizer 0.0.2 (tar.gz) → 0.0.3 (tar.gz)

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions as they appear in their respective public registries.

Potentially problematic release.

This version of recent-state-summarizer might be problematic. Click here for more details.

Files changed (19)

{recent_state_summarizer-0.0.2/recent_state_summarizer.egg-info → recent_state_summarizer-0.0.3}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: recent-state-summarizer
-Version: 0.0.2
+Version: 0.0.3
 Summary: Summarize a list of entry titles using LLM
 Author-email: nikkie <takuyafjp+develop@gmail.com>
 License: MIT

recent_state_summarizer-0.0.3/recent_state_summarizer/__init__.py ADDED Viewed

	@@ -0,0 +1 @@
1	+ __version__ = "0.0.3"

{recent_state_summarizer-0.0.2 → recent_state_summarizer-0.0.3}/recent_state_summarizer/fetch.py RENAMED Viewed

@@ -31,6 +31,13 @@ def _fetch_titles(url: str) -> Generator[TitleTag, None, None]:
     raw_html = _fetch(url)
     yield from _parse_titles(raw_html)
+    soup = BeautifulSoup(raw_html, "html.parser")
+    next_link = soup.find("a", class_="test-pager-next")
+    if next_link and "href" in next_link.attrs:
+        next_url = next_link["href"]
+        print(f"Next page found, fetching... {next_url}")
+        yield from _fetch_titles(next_url)
 def _fetch(url: str) -> str:
     with urlopen(url) as res:

{recent_state_summarizer-0.0.2 → recent_state_summarizer-0.0.3/recent_state_summarizer.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: recent-state-summarizer
-Version: 0.0.2
+Version: 0.0.3
 Summary: Summarize a list of entry titles using LLM
 Author-email: nikkie <takuyafjp+develop@gmail.com>
 License: MIT

recent_state_summarizer-0.0.3/tests/test_fetch.py ADDED Viewed

@@ -0,0 +1,150 @@
+import pytest
+from recent_state_summarizer.fetch import _main
+@pytest.fixture
+def blog_server(httpserver):
+    httpserver.expect_request("/archive/2025/06").respond_with_data(
+        f"""\
+<!DOCTYPE html>
+<html>
+  <head><title>Archive</title></head>
+  <body>
+    <h1>Archive</h1>
+    <div id="content">
+      <div id="content-inner">
+        <div id="wrapper">
+          <div id="main">
+            <div id="main-inner">
+              <div class="archive-entries">
+                <section class="archive-entry">
+                  <a class="entry-title-link" href="{httpserver.url_for('/')}archive/2025/06/03">Title 3</a>
+                </section>
+                <section class="archive-entry">
+                  <a class="entry-title-link" href="{httpserver.url_for('/')}archive/2025/06/02">Title 2</a>
+                </section>
+                <section class="archive-entry">
+                  <a class="entry-title-link" href="{httpserver.url_for('/')}archive/2025/06/01">Title 1</a>
+                </section>
+              </div>
+            </div>
+          </div>
+        </div>
+      </div>
+    </div>
+  </body>
+</html>"""
+    )
+    return httpserver
+def test_fetch_as_bullet_list(blog_server, tmp_path):
+    _main(
+        blog_server.url_for("/archive/2025/06"),
+        tmp_path / "titles.txt",
+        save_as_json=False,
+    )
+    expected = """\
+- Title 3
+- Title 2
+- Title 1"""
+    assert (tmp_path / "titles.txt").read_text(encoding="utf8") == expected
+def test_fetch_as_json(blog_server, tmp_path):
+    _main(
+        blog_server.url_for("/archive/2025/06"),
+        tmp_path / "titles.json",
+        save_as_json=True,
+    )
+    expected = f"""\
+{{"title": "Title 3", "url": "{blog_server.url_for('/archive/2025/06/03')}"}}
+{{"title": "Title 2", "url": "{blog_server.url_for('/archive/2025/06/02')}"}}
+{{"title": "Title 1", "url": "{blog_server.url_for('/archive/2025/06/01')}"}}"""
+    assert (tmp_path / "titles.json").read_text(encoding="utf8") == expected
+@pytest.fixture
+def multi_page_blog_server(httpserver):
+    httpserver.expect_request(
+        "/archive/2025/07", query_string="page=2"
+    ).respond_with_data(
+        f"""\
+<!DOCTYPE html>
+<html>
+  <head><title>Archive (Page 2)</title></head>
+  <body>
+    <h1>Archive</h1>
+    <div id="content">
+      <div id="content-inner">
+        <div id="wrapper">
+          <div id="main">
+            <div id="main-inner">
+              <div class="archive-entries">
+                <section class="archive-entry">
+                  <a class="entry-title-link" href="{httpserver.url_for('/')}archive/2025/07/01">Title 1</a>
+                </section>
+              </div>
+              <div class="pager">
+                <span class="pager-prev">
+                  <a href="{httpserver.url_for('/')}archive/2025/07" class="test-pager-prev" rel="prev">前のページ</a>
+                </span>
+              </div>
+            </div>
+          </div>
+        </div>
+      </div>
+    </div>
+  </body>
+</html>"""
+    )
+    httpserver.expect_request("/archive/2025/07").respond_with_data(
+        f"""\
+<!DOCTYPE html>
+<html>
+  <head><title>Archive</title></head>
+  <body>
+    <h1>Archive</h1>
+    <div id="content">
+      <div id="content-inner">
+        <div id="wrapper">
+          <div id="main">
+            <div id="main-inner">
+              <div class="archive-entries">
+                <section class="archive-entry">
+                  <a class="entry-title-link" href="{httpserver.url_for('/')}archive/2025/07/03">Title 3</a>
+                </section>
+                <section class="archive-entry">
+                  <a class="entry-title-link" href="{httpserver.url_for('/')}archive/2025/07/02">Title 2</a>
+                </section>
+              </div>
+            </div>
+            <div class="pager">
+              <span class="pager-next">
+                <a href="{httpserver.url_for('/')}archive/2025/07?page=2" class="test-pager-next" rel="next">次のページ</a>
+              </span>
+            </div>
+          </div>
+        </div>
+      </div>
+    </div>
+  </body>
+</html>"""
+    )
+    return httpserver
+def test_fetch_multiple_archive_page(multi_page_blog_server, tmp_path):
+    _main(
+        multi_page_blog_server.url_for("/archive/2025/07"),
+        tmp_path / "titles.txt",
+        save_as_json=False,
+    )
+    expected = """- Title 3
+- Title 2
+- Title 1"""
+    assert (tmp_path / "titles.txt").read_text(encoding="utf8") == expected

recent_state_summarizer-0.0.2/recent_state_summarizer/__init__.py DELETED Viewed

	@@ -1 +0,0 @@
1	- __version__ = "0.0.2"

recent_state_summarizer-0.0.2/tests/test_fetch.py DELETED Viewed

@@ -1,64 +0,0 @@
-from textwrap import dedent
-import pytest
-from recent_state_summarizer.fetch import _main
-@pytest.fixture
-def blog_server(httpserver):
-    httpserver.expect_request("/archive/2025/06").respond_with_data(
-        dedent(
-            f"""
-        <!DOCTYPE html>
-        <html>
-          <head><title>Archive</title></head>
-          <body>
-            <h1>Archive</h1>
-            <div id="content">
-              <div class="archive-entries">
-                <section class="archive-entry">
-                  <a class="entry-title-link" href="{httpserver.url_for('/')}archive/2025/06/03">Title 3</a>
-                </section>
-                <section class="archive-entry">
-                  <a class="entry-title-link" href="{httpserver.url_for('/')}archive/2025/06/02">Title 2</a>
-                </section>
-                <section class="archive-entry">
-                  <a class="entry-title-link" href="{httpserver.url_for('/')}archive/2025/06/01">Title 1</a>
-                </section>
-              </div>
-            </div>
-          </body>
-        </html>
-        """
-        )
-    )
-    return httpserver
-def test_fetch_as_bullet_list(blog_server, tmp_path):
-    _main(
-        blog_server.url_for("/archive/2025/06"),
-        tmp_path / "titles.txt",
-        save_as_json=False,
-    )
-    expected = """\
-- Title 3
-- Title 2
-- Title 1"""
-    assert (tmp_path / "titles.txt").read_text(encoding="utf8") == expected
-def test_fetch_as_json(blog_server, tmp_path):
-    _main(
-        blog_server.url_for("/archive/2025/06"),
-        tmp_path / "titles.json",
-        save_as_json=True,
-    )
-    expected = f"""\
-{{"title": "Title 3", "url": "{blog_server.url_for('/archive/2025/06/03')}"}}
-{{"title": "Title 2", "url": "{blog_server.url_for('/archive/2025/06/02')}"}}
-{{"title": "Title 1", "url": "{blog_server.url_for('/archive/2025/06/01')}"}}"""
-    assert (tmp_path / "titles.json").read_text(encoding="utf8") == expected