PyPI - tumblrbot - Versions diffs - 1.4.6__py3-none-any.whl → 1.4.7__py3-none-any.whl - Mend

tumblrbot 1.4.6__py3-none-any.whl → 1.4.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13)

tumblrbot/__main__.py +1 -1
tumblrbot/flow/download.py +1 -1
tumblrbot/flow/examples.py +2 -2
tumblrbot/flow/fine_tune.py +2 -2
tumblrbot/utils/common.py +3 -3
tumblrbot/utils/models.py +99 -16
tumblrbot/utils/tumblr.py +1 -2
{tumblrbot-1.4.6.dist-info → tumblrbot-1.4.7.dist-info}/METADATA +3 -5
tumblrbot-1.4.7.dist-info/RECORD +15 -0
tumblrbot/utils/config.py +0 -97
tumblrbot-1.4.6.dist-info/RECORD +0 -16
{tumblrbot-1.4.6.dist-info → tumblrbot-1.4.7.dist-info}/WHEEL +0 -0
{tumblrbot-1.4.6.dist-info → tumblrbot-1.4.7.dist-info}/entry_points.txt +0 -0

tumblrbot/__main__.py CHANGED Viewed

@@ -14,7 +14,7 @@ from tumblrbot.utils.tumblr import TumblrSession
 def main() -> None:
     install()
-    tokens = Tokens.read_from_keyring()
+    tokens = Tokens.load()
     with OpenAI(api_key=tokens.openai_api_key) as openai, TumblrSession(tokens) as tumblr:
         if Confirm.ask("Download latest posts?", default=False):
             PostDownloader(openai=openai, tumblr=tumblr).main()

tumblrbot/flow/download.py CHANGED Viewed

@@ -18,7 +18,7 @@ class PostDownloader(FlowClass):
                 completed = 0
                 after = 0
                 if data_path.exists():
-                    lines = data_path.read_text("utf_8").splitlines() if data_path.exists() else []
+                    lines = data_path.read_bytes().splitlines() if data_path.exists() else []
                     completed = len(lines)
                     if lines:
                         after = Post.model_validate_json(lines[-1]).timestamp

tumblrbot/flow/examples.py CHANGED Viewed

@@ -49,7 +49,7 @@ class ExamplesWriter(FlowClass):
         self.config.custom_prompts_file.parent.mkdir(parents=True, exist_ok=True)
         self.config.custom_prompts_file.touch(exist_ok=True)
-        with self.config.custom_prompts_file.open("r", encoding="utf_8") as fp:
+        with self.config.custom_prompts_file.open("rb") as fp:
             for line in fp:
                 data: dict[str, str] = loads(line)
                 yield from data.items()
@@ -81,7 +81,7 @@ class ExamplesWriter(FlowClass):
     def get_valid_posts(self) -> Generator[Post]:
         for data_path in self.get_data_paths():
-            with data_path.open(encoding="utf_8") as fp:
+            with data_path.open("rb") as fp:
                 for line in fp:
                     post = Post.model_validate_json(line)
                     if post.valid_text_post():

tumblrbot/flow/fine_tune.py CHANGED Viewed

@@ -98,8 +98,8 @@ class FineTuner(FlowClass):
             if job.status == "failed" and job.error is not None:
                 raise RuntimeError(job.error.message)
-        if job.fine_tuned_model:
-            self.config.fine_tuned_model = job.fine_tuned_model or ""
+        if job.fine_tuned_model is not None:
+            self.config.fine_tuned_model = job.fine_tuned_model
     def print_estimates(self) -> None:
         estimated_tokens = sum(self.count_tokens())

tumblrbot/utils/common.py CHANGED Viewed

@@ -1,4 +1,5 @@
 from abc import abstractmethod
+from pathlib import Path
 from random import choice
 from typing import ClassVar, Self, override
@@ -10,15 +11,14 @@ from rich.live import Live
 from rich.progress import MofNCompleteColumn, Progress, SpinnerColumn, TimeElapsedColumn
 from rich.table import Table
-from tumblrbot.utils.config import Config, Path
-from tumblrbot.utils.models import FullyValidatedModel
+from tumblrbot.utils.models import Config, FullyValidatedModel
 from tumblrbot.utils.tumblr import TumblrSession
 class FlowClass(FullyValidatedModel):
     model_config = ConfigDict(arbitrary_types_allowed=True)
-    config: ClassVar = Config()  # pyright: ignore[reportCallIssue]
+    config: ClassVar = Config.load()
     openai: OpenAI
     tumblr: TumblrSession

tumblrbot/utils/models.py CHANGED Viewed

@@ -1,15 +1,20 @@
+import tomllib
+from abc import abstractmethod
 from collections.abc import Generator
+from pathlib import Path
 from typing import Annotated, Any, ClassVar, Literal, Self, override
 import rich
+import tomlkit
 from keyring import get_password, set_password
-from openai import BaseModel
+from openai.types import ChatModel
 from pwinput import pwinput
-from pydantic import ConfigDict, PlainSerializer
+from pydantic import BaseModel, ConfigDict, Field, NonNegativeFloat, PlainSerializer, PositiveFloat, PositiveInt, model_validator
 from pydantic.json_schema import SkipJsonSchema
 from requests_oauthlib import OAuth1Session
 from rich.panel import Panel
-from rich.prompt import Confirm
+from rich.prompt import Confirm, Prompt
+from tomlkit import comment, document
 class FullyValidatedModel(BaseModel):
@@ -22,7 +27,85 @@ class FullyValidatedModel(BaseModel):
     )
-class Tokens(FullyValidatedModel):
+class FileSyncSettings(FullyValidatedModel):
+    @classmethod
+    @abstractmethod
+    def read(cls) -> Self | dict[str, object] | str | None: ...
+    @classmethod
+    def load(cls) -> Self:
+        data = cls.read() or {}
+        return cls.model_validate_json(data) if isinstance(data, str) else cls.model_validate(data)
+    @model_validator(mode="after")
+    @abstractmethod
+    def write(self) -> Self: ...
+class Config(FileSyncSettings):
+    toml_file: ClassVar = Path("config.toml")
+    # Downloading Posts & Writing Examples
+    download_blog_identifiers: list[str] = Field([], description="The identifiers of the blogs which post data will be downloaded from. These must be blogs associated with the same account as the configured Tumblr secret tokens.")
+    data_directory: Path = Field(Path("data"), description="Where to store downloaded post data.")
+    # Writing Examples
+    max_moderation_batch_size: PositiveInt = Field(100, description="How many posts, at most, to submit to the OpenAI moderation API. This is also capped by the API.")
+    custom_prompts_file: Path = Field(Path("custom_prompts.jsonl"), description="Where to read in custom prompts from.")
+    # Writing Examples & Fine-Tuning
+    examples_file: Path = Field(Path("examples.jsonl"), description="Where to output the examples that will be used to fine-tune the model.")
+    # Writing Examples & Generating
+    developer_message: str = Field("You are a Tumblr post bot. Please generate a Tumblr post in accordance with the user's request.", description="The developer message used by the OpenAI API to generate drafts.")
+    user_message: str = Field("Please write a comical Tumblr post.", description="The user input used by the OpenAI API to generate drafts.")
+    # Fine-Tuning
+    expected_epochs: PositiveInt = Field(3, description="The expected number of epochs fine-tuning will be run for. This will be updated during fine-tuning.")
+    token_price: PositiveFloat = Field(3, description="The expected price in USD per million tokens during fine-tuning for the current model.")
+    job_id: str = Field("", description="The fine-tuning job ID that will be polled on next run.")
+    # Fine-Tuning & Generating
+    base_model: ChatModel = Field("gpt-4o-mini-2024-07-18", description="The name of the model that will be fine-tuned by the generated training data.")
+    fine_tuned_model: str = Field("", description="The name of the OpenAI model that was fine-tuned with your posts.")
+    # Generating
+    upload_blog_identifier: str = Field("", description="The identifier of the blog which generated drafts will be uploaded to. This must be a blog associated with the same account as the configured Tumblr secret tokens.")
+    draft_count: PositiveInt = Field(150, description="The number of drafts to process. This will affect the number of tokens used with OpenAI")
+    tags_chance: NonNegativeFloat = Field(0.1, description="The chance to generate tags for any given post. This will incur extra calls to OpenAI.")
+    tags_developer_message: str = Field("You will be provided with a block of text, and your task is to extract a very short list of the most important subjects from it.", description="The developer message used to generate tags.")
+    @classmethod
+    @override
+    def read(cls) -> dict[str, object] | None:
+        return tomllib.loads(cls.toml_file.read_text("utf_8")) if cls.toml_file.exists() else None
+    @model_validator(mode="after")
+    @override
+    def write(self) -> Self:
+        if not self.download_blog_identifiers:
+            rich.print("Enter the [cyan]identifiers of your blogs[/] that data should be [bold purple]downloaded[/] from, separated by commas.")
+            self.download_blog_identifiers = list(map(str.strip, Prompt.ask("[bold][Example] [dim]staff.tumblr.com,changes").split(",")))
+        if not self.upload_blog_identifier:
+            rich.print("Enter the [cyan]identifier of your blog[/] that drafts should be [bold purple]uploaded[/] to.")
+            self.upload_blog_identifier = Prompt.ask("[bold][Example] [dim]staff.tumblr.com or changes").strip()
+        toml_table = document()
+        for (name, field), value in zip(self.__class__.model_fields.items(), self.model_dump(mode="json").values(), strict=True):
+            if field.description is not None:
+                for line in field.description.split(". "):
+                    toml_table.add(comment(f"{line.removesuffix('.')}."))
+            toml_table[name] = value
+        Path(self.toml_file).write_text(tomlkit.dumps(toml_table), encoding="utf_8")
+        return self
+class Tokens(FileSyncSettings):
     class Tumblr(FullyValidatedModel):
         client_key: str = ""
         client_secret: str = ""
@@ -50,15 +133,13 @@ class Tokens(FullyValidatedModel):
         rich.print()
     @classmethod
-    def read_from_keyring(cls) -> Self:
-        if json_data := get_password(cls.service_name, cls.username):
-            return cls.model_validate_json(json_data)
-        return cls()
     @override
-    def model_post_init(self, context: object) -> None:
-        super().model_post_init(context)
+    def read(cls) -> str | None:
+        return get_password(cls.service_name, cls.username)
+    @model_validator(mode="after")
+    @override
+    def write(self) -> Self:
         if not self.openai_api_key or Confirm.ask("Reset OpenAI API key?", default=False):
             (self.openai_api_key,) = self.online_token_prompt("https://platform.openai.com/api-keys", "API key")
@@ -86,20 +167,22 @@ class Tokens(FullyValidatedModel):
         set_password(self.service_name, self.username, self.model_dump_json())
+        return self
 class Post(FullyValidatedModel):
     class Block(FullyValidatedModel):
         type: str = "text"
         text: str = ""
-        blocks: list[int] = []  # noqa: RUF012
+        blocks: list[int] = []
     timestamp: SkipJsonSchema[int] = 0
-    tags: Annotated[list[str], PlainSerializer(",".join)] = []  # noqa: RUF012
+    tags: Annotated[list[str], PlainSerializer(",".join)] = []
     state: SkipJsonSchema[Literal["published", "queued", "draft", "private", "unapproved"]] = "draft"
-    content: SkipJsonSchema[list[Block]] = []  # noqa: RUF012
-    layout: SkipJsonSchema[list[Block]] = []  # noqa: RUF012
-    trail: SkipJsonSchema[list[Any]] = []  # noqa: RUF012
+    content: SkipJsonSchema[list[Block]] = []
+    layout: SkipJsonSchema[list[Block]] = []
+    trail: SkipJsonSchema[list[Any]] = []
     is_submission: SkipJsonSchema[bool] = False

tumblrbot/utils/tumblr.py CHANGED Viewed

@@ -19,8 +19,7 @@ class TumblrSession(OAuth1Session):
         try:
             response.raise_for_status()
         except HTTPError as error:
-            if response.text:
-                error.add_note(response.text)
+            error.add_note(response.text)
             raise
     def retrieve_published_posts(self, blog_identifier: str, after: int) -> Response:

{tumblrbot-1.4.6.dist-info → tumblrbot-1.4.7.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: tumblrbot
-Version: 1.4.6
+Version: 1.4.7
 Summary: An updated bot that posts to Tumblr, based on your very own blog!
 Requires-Python: >= 3.13
 Description-Content-Type: text/markdown
@@ -8,13 +8,12 @@ Requires-Dist: keyring
 Requires-Dist: openai
 Requires-Dist: pwinput
 Requires-Dist: pydantic
-Requires-Dist: pydantic-settings
 Requires-Dist: requests
 Requires-Dist: requests-oauthlib
 Requires-Dist: rich
 Requires-Dist: tiktoken
 Requires-Dist: tomlkit
-Project-URL: Source, https://github.com/MaidThatPrograms/tumblrbot
+Project-URL: Source, https://github.com/MaidScientistIzutsumiMarin/tumblrbot
 # tumblrbot
@@ -57,7 +56,6 @@ Features:
 - An [interactive console][Main] for all steps of generating posts for the blog:
    1. Asks for [OpenAI] and [Tumblr] tokens.
       - Stores API tokens using [keyring].
-      - Prevents API tokens from printing to the console.
    1. Retrieves [Tumblr] [OAuth] tokens.
    1. [Downloads posts][Download] from the [configured][config] [Tumblr] blogs.
       - Skips redownloading already downloaded posts.
@@ -67,8 +65,8 @@ Features:
       - Filters out any posts flagged by the [OpenAI] [Moderation API] (optional).
          - Shows progress and previews the current post.
       - Adds custom user messages and assistant responses to the dataset from the [configured][config] file.
-   1. Provides cost estimates if the currently saved examples are used to fine-tune the [configured][config] model.
    1. [Uploads examples][Fine-Tune] to [OpenAI] and begins the fine-tuning process.
+      - Provides cost estimates if the currently saved examples are used to fine-tune the [configured][config] model.
       - Resumes monitoring the same fine-tuning process when restarted.
       - Deletes the uploaded examples file if fine-tuning does not succeed (optional).
       - Stores the output model automatically when fine-tuning is completed.

tumblrbot-1.4.7.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,15 @@
+tumblrbot/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+tumblrbot/__main__.py,sha256=BenjVNlVZDy-ZlSWukEIguGLa6qXvZjhYSSWMqa8-0Q,1447
+tumblrbot/flow/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+tumblrbot/flow/download.py,sha256=wdXmtCnnArn8Zw7D2Hoa_KhH-k61j9w3cbYztgBkUlY,2036
+tumblrbot/flow/examples.py,sha256=Th6vgiu3D2VloOx7otZlk164h3ifkJEwDk21YHMEYP0,3976
+tumblrbot/flow/fine_tune.py,sha256=YDukEwZNw3GveEAH4ORv6oylka5MQNLK_4iSmuAVPtg,5387
+tumblrbot/flow/generate.py,sha256=Q6nUtmoj28-rGUCs4V0fuovJshvFMlmipyu9GGqnmzM,2147
+tumblrbot/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+tumblrbot/utils/common.py,sha256=RvICPORtBSqsN7VWADgStogJ8w4owzBfR1E2XbCQrfA,1795
+tumblrbot/utils/models.py,sha256=Z0k16qJsZEO8tfmPp7X3edz-RgGCDLRSm7HrSDLGh1Y,9663
+tumblrbot/utils/tumblr.py,sha256=6V9AjT-dyR2vuUkfqgqs52Ua5irhQJzhgQhV54xKyGM,1258
+tumblrbot-1.4.7.dist-info/entry_points.txt,sha256=lTiN7PxAbyGY1fpCWApEw6NUIUgobfcOKhvn6cu3IQA,53
+tumblrbot-1.4.7.dist-info/WHEEL,sha256=G2gURzTEtmeR8nrdXUJfNiB3VYVxigPQ-bEQujpNiNs,82
+tumblrbot-1.4.7.dist-info/METADATA,sha256=q_PH1oU-d0PRdXDuL5Bjh-Y8gccZJVvLCCho2E_CLvc,10104
+tumblrbot-1.4.7.dist-info/RECORD,,

tumblrbot/utils/config.py DELETED Viewed

@@ -1,97 +0,0 @@
-from collections.abc import Sequence
-from pathlib import Path
-from typing import TYPE_CHECKING, Self, override
-import rich
-import tomlkit
-from openai.types import ChatModel
-from pydantic import Field, NonNegativeFloat, PositiveFloat, PositiveInt, model_validator
-from pydantic_settings import BaseSettings, PydanticBaseSettingsSource, SettingsConfigDict, TomlConfigSettingsSource
-from rich.prompt import Prompt
-from tomlkit import comment, document
-if TYPE_CHECKING:
-    from _typeshed import StrPath
-class Config(BaseSettings):
-    model_config = SettingsConfigDict(
-        extra="ignore",
-        validate_assignment=True,
-        validate_return=True,
-        validate_by_name=True,
-        cli_parse_args=True,
-        cli_avoid_json=True,
-        cli_kebab_case=True,
-        toml_file="config.toml",
-    )
-    # Downloading Posts & Writing Examples
-    download_blog_identifiers: list[str] = Field([], description="The identifiers of the blogs which post data will be downloaded from. These must be blogs associated with the same account as the configured Tumblr secret tokens.")
-    data_directory: Path = Field(Path("data"), description="Where to store downloaded post data.")
-    # Writing Examples
-    max_moderation_batch_size: PositiveInt = Field(100, description="How many posts, at most, to submit to the OpenAI moderation API. This is also capped by the API.")
-    custom_prompts_file: Path = Field(Path("custom_prompts.jsonl"), description="Where to read in custom prompts from.")
-    # Writing Examples & Fine-Tuning
-    examples_file: Path = Field(Path("examples.jsonl"), description="Where to output the examples that will be used to fine-tune the model.")
-    # Writing Examples & Generating
-    developer_message: str = Field("You are a Tumblr post bot. Please generate a Tumblr post in accordance with the user's request.", description="The developer message used by the OpenAI API to generate drafts.")
-    user_message: str = Field("Please write a comical Tumblr post.", description="The user input used by the OpenAI API to generate drafts.")
-    # Fine-Tuning
-    expected_epochs: PositiveInt = Field(3, description="The expected number of epochs fine-tuning will be run for. This will be updated during fine-tuning.")
-    token_price: PositiveFloat = Field(3, description="The expected price in USD per million tokens during fine-tuning for the current model.")
-    job_id: str = Field("", description="The fine-tuning job ID that will be polled on next run.")
-    # Fine-Tuning & Generating
-    base_model: ChatModel = Field("gpt-4o-mini-2024-07-18", description="The name of the model that will be fine-tuned by the generated training data.")
-    fine_tuned_model: str = Field("", description="The name of the OpenAI model that was fine-tuned with your posts.")
-    # Generating
-    upload_blog_identifier: str = Field("", description="The identifier of the blog which generated drafts will be uploaded to. This must be a blog associated with the same account as the configured Tumblr secret tokens.")
-    draft_count: PositiveInt = Field(150, description="The number of drafts to process. This will affect the number of tokens used with OpenAI")
-    tags_chance: NonNegativeFloat = Field(0.1, description="The chance to generate tags for any given post. This will incur extra calls to OpenAI.")
-    tags_developer_message: str = Field("You will be provided with a block of text, and your task is to extract a very short list of the most important subjects from it.", description="The developer message used to generate tags.")
-    @override
-    @classmethod
-    def settings_customise_sources(cls, settings_cls: type[BaseSettings], *args: PydanticBaseSettingsSource, **kwargs: PydanticBaseSettingsSource) -> tuple[PydanticBaseSettingsSource, ...]:
-        return (TomlConfigSettingsSource(settings_cls),)
-    @model_validator(mode="after")
-    def write_to_file(self) -> Self:
-        if not self.download_blog_identifiers:
-            rich.print("Enter the [cyan]identifiers of your blogs[/] that data should be [bold purple]downloaded[/] from, separated by commas.")
-            self.download_blog_identifiers = list(map(str.strip, Prompt.ask("[bold][Example] [dim]staff.tumblr.com,changes").split(",")))
-        if not self.upload_blog_identifier:
-            rich.print("Enter the [cyan]identifier of your blog[/] that drafts should be [bold purple]uploaded[/] to.")
-            self.upload_blog_identifier = Prompt.ask("[bold][Example] [dim]staff.tumblr.com or changes").strip()
-        toml_files = self.model_config.get("toml_file")
-        if isinstance(toml_files, (Path, str)):
-            self.dump_toml(toml_files)
-        elif isinstance(toml_files, Sequence):
-            for toml_file in toml_files:
-                self.dump_toml(toml_file)
-        return self
-    def dump_toml(self, toml_file: "StrPath") -> None:
-        toml_table = document()
-        dumped_model = self.model_dump(mode="json")
-        for name, field in self.__class__.model_fields.items():
-            if field.description:
-                for line in field.description.split(". "):
-                    toml_table.add(comment(f"{line.removesuffix('.')}."))
-            toml_table[name] = dumped_model[name]
-        Path(toml_file).write_text(
-            tomlkit.dumps(toml_table),
-            encoding="utf_8",
-        )

tumblrbot-1.4.6.dist-info/RECORD DELETED Viewed

@@ -1,16 +0,0 @@
-tumblrbot/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-tumblrbot/__main__.py,sha256=fV0lBm5FqTvBoq5g8soG1x0w0qebyR_oL5_339z4GpM,1460
-tumblrbot/flow/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-tumblrbot/flow/download.py,sha256=xSfic66FR-LIG0KtJMcM5KVd2hiijCH3cyD7dzFKwLM,2042
-tumblrbot/flow/examples.py,sha256=6A6bqHwLIUtEr-dv-FcWbMdVVMFImHhuMmlJLyuSW6U,4005
-tumblrbot/flow/fine_tune.py,sha256=X9xR9uPgiK6DKQ-lZ6oqwTPypUx5D5S1MiKrFKSm5ng,5381
-tumblrbot/flow/generate.py,sha256=Q6nUtmoj28-rGUCs4V0fuovJshvFMlmipyu9GGqnmzM,2147
-tumblrbot/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-tumblrbot/utils/common.py,sha256=tnKBBiEGQPOWByLi0vT31BzpntndbIP_JekGkgjy15U,1841
-tumblrbot/utils/config.py,sha256=AlHZLx74-202BNwELNE3MzTg2Ru7R_Q5u8h9S4QGkJk,5460
-tumblrbot/utils/models.py,sha256=bLB96qrHBr18_X6-zHatc-bczej0kLUrZxyceITAWqo,4936
-tumblrbot/utils/tumblr.py,sha256=9lAbjO-27cpju9Wewv26lyQoogybs8b1y8mvYIuHkqw,1293
-tumblrbot-1.4.6.dist-info/entry_points.txt,sha256=lTiN7PxAbyGY1fpCWApEw6NUIUgobfcOKhvn6cu3IQA,53
-tumblrbot-1.4.6.dist-info/WHEEL,sha256=G2gURzTEtmeR8nrdXUJfNiB3VYVxigPQ-bEQujpNiNs,82
-tumblrbot-1.4.6.dist-info/METADATA,sha256=IotLVzlM8nw8XwxwBt-TjGozYHEKuJRD1n1hdbevs1Q,10183
-tumblrbot-1.4.6.dist-info/RECORD,,

{tumblrbot-1.4.6.dist-info → tumblrbot-1.4.7.dist-info}/WHEEL RENAMED Viewed

File without changes

{tumblrbot-1.4.6.dist-info → tumblrbot-1.4.7.dist-info}/entry_points.txt RENAMED Viewed

File without changes

tumblrbot 1.4.6__py3-none-any.whl → 1.4.7__py3-none-any.whl

tumblrbot 1.4.6__py3-none-any.whl → 1.4.7__py3-none-any.whl