PyPI - tinybird - Versions diffs - 0.0.1.dev0__py3-none-any.whl - Mend

tinybird 0.0.1.dev0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of tinybird might be problematic. Click here for more details.

Files changed (45) hide show

tinybird/__cli__.py +8 -0
tinybird/ch_utils/constants.py +244 -0
tinybird/ch_utils/engine.py +855 -0
tinybird/check_pypi.py +25 -0
tinybird/client.py +1281 -0
tinybird/config.py +117 -0
tinybird/connectors.py +428 -0
tinybird/context.py +23 -0
tinybird/datafile.py +5589 -0
tinybird/datatypes.py +434 -0
tinybird/feedback_manager.py +1022 -0
tinybird/git_settings.py +145 -0
tinybird/sql.py +865 -0
tinybird/sql_template.py +2343 -0
tinybird/sql_template_fmt.py +281 -0
tinybird/sql_toolset.py +350 -0
tinybird/syncasync.py +682 -0
tinybird/tb_cli.py +25 -0
tinybird/tb_cli_modules/auth.py +252 -0
tinybird/tb_cli_modules/branch.py +1043 -0
tinybird/tb_cli_modules/cicd.py +434 -0
tinybird/tb_cli_modules/cli.py +1571 -0
tinybird/tb_cli_modules/common.py +2082 -0
tinybird/tb_cli_modules/config.py +344 -0
tinybird/tb_cli_modules/connection.py +803 -0
tinybird/tb_cli_modules/datasource.py +900 -0
tinybird/tb_cli_modules/exceptions.py +91 -0
tinybird/tb_cli_modules/fmt.py +91 -0
tinybird/tb_cli_modules/job.py +85 -0
tinybird/tb_cli_modules/pipe.py +858 -0
tinybird/tb_cli_modules/regions.py +9 -0
tinybird/tb_cli_modules/tag.py +100 -0
tinybird/tb_cli_modules/telemetry.py +310 -0
tinybird/tb_cli_modules/test.py +107 -0
tinybird/tb_cli_modules/tinyunit/tinyunit.py +340 -0
tinybird/tb_cli_modules/tinyunit/tinyunit_lib.py +71 -0
tinybird/tb_cli_modules/token.py +349 -0
tinybird/tb_cli_modules/workspace.py +269 -0
tinybird/tb_cli_modules/workspace_members.py +212 -0
tinybird/tornado_template.py +1194 -0
tinybird-0.0.1.dev0.dist-info/METADATA +2815 -0
tinybird-0.0.1.dev0.dist-info/RECORD +45 -0
tinybird-0.0.1.dev0.dist-info/WHEEL +5 -0
tinybird-0.0.1.dev0.dist-info/entry_points.txt +2 -0
tinybird-0.0.1.dev0.dist-info/top_level.txt +4 -0

tinybird/tb_cli_modules/regions.py ADDED Viewed

@@ -0,0 +1,9 @@
+from typing import Optional, TypedDict
+class Region(TypedDict):
+    """Typed dictionary with the keys that describe a region."""
+    # NOTE(review): the meaning of each key is inferred from its name only -- confirm against the callers.
+    name: str
+    provider: str
+    api_host: str
+    host: str
+    # The only key whose value may be None.
+    default_password: Optional[str]

tinybird/tb_cli_modules/tag.py ADDED Viewed

@@ -0,0 +1,100 @@
+from typing import Optional
+import click
+from click import Context
+from tinybird.feedback_manager import FeedbackManager
+from tinybird.tb_cli_modules.cli import cli
+from tinybird.tb_cli_modules.common import coro, echo_safe_humanfriendly_tables_format_smart_table
+@cli.group()
+@click.pass_context
+def tag(ctx: Context) -> None:
+    """Tag commands"""
+    # Group that holds the subcommands registered below with `@tag.command`; it does no work itself.
+@tag.command(name="ls")
+@click.argument("tag_name", required=False)
+@click.pass_context
+@coro
+async def tag_ls(ctx: Context, tag_name: Optional[str]) -> None:
+    """List all the tags of the current Workspace or the resources associated to a specific tag."""
+    client = ctx.ensure_object(dict)["client"]
+    response = await client.get_all_tags()
+    if tag_name:
+        the_tag = [tag for tag in response["tags"] if tag["name"] == tag_name]
+        columns = ["name", "id", "type"]
+        table = []
+        if len(the_tag) > 0:
+            for resource in the_tag[0]["resources"]:
+                table.append([resource["name"], resource["id"], resource["type"]])
+        click.echo(FeedbackManager.info_tag_resources(tag_name=tag_name))
+        echo_safe_humanfriendly_tables_format_smart_table(table, column_names=columns)
+        return
+    columns = ["tag", "resources"]
+    table = []
+    for tag in response["tags"]:
+        unique_resources = []
+        for resource in tag["resources"]:
+            if resource.get("name", "") not in unique_resources:
+                unique_resources.append(resource)  # Reducing by name in case there are duplicates.
+        table.append([tag["name"], len(unique_resources)])
+    click.echo(FeedbackManager.info_tag_list())
+    echo_safe_humanfriendly_tables_format_smart_table(table, column_names=columns)
+@tag.command(name="create")
+@click.argument("tag_name")
+@click.pass_context
+@coro
+async def tag_create(ctx: Context, tag_name: str) -> None:
+    """Create a tag in the current Workspace."""
+    client = ctx.ensure_object(dict)["client"]
+    await client.create_tag(name=tag_name)
+    click.echo(FeedbackManager.success_tag_created(tag_name=tag_name))
+@tag.command(name="rm")
+@click.argument("tag_name")
+@click.option("--yes", is_flag=True, default=False, help="Do not ask for confirmation to delete the tag.")
+@click.pass_context
+@coro
+async def tag_rm(ctx: Context, tag_name: str, yes: bool) -> None:
+    """Remove a tag from the current Workspace."""
+    client = ctx.ensure_object(dict)["client"]
+    remove_tag = True
+    if not yes:
+        all_tags = await client.get_all_tags()
+        the_tag = [tag for tag in all_tags["tags"] if tag["name"] == tag_name]
+        if len(the_tag) > 0:
+            unique_resources = []
+            for resource in the_tag[0]["resources"]:
+                if resource.get("name", "") not in unique_resources:
+                    unique_resources.append(resource)  # Reducing by name in case there are duplicates.
+            if len(unique_resources) > 0:
+                remove_tag = click.confirm(
+                    FeedbackManager.warning_tag_remove(tag_name=tag_name, resources_len=len(unique_resources))
+                )
+            else:
+                remove_tag = click.confirm(FeedbackManager.warning_tag_remove_no_resources(tag_name=tag_name))
+        else:
+            remove_tag = False
+            click.echo(FeedbackManager.error_tag_not_found(tag_name=tag_name))
+    if remove_tag:
+        await client.delete_tag(tag_name)
+        click.echo(FeedbackManager.success_tag_removed(tag_name=tag_name))

tinybird/tb_cli_modules/telemetry.py ADDED Viewed

@@ -0,0 +1,310 @@
+import functools
+import json
+import os
+import platform
+import re
+import sys
+import threading
+import uuid
+from copy import deepcopy
+from datetime import datetime
+from typing import Any, Callable, Dict, List, Optional, Tuple
+from urllib.parse import urlencode
+import requests
+from tinybird.config import CURRENT_VERSION
+# Default and minimum timeout, in seconds, applied to the telemetry HTTP requests.
+TELEMETRY_TIMEOUT: int = 1
+# Value sent as the `name` parameter of the events endpoint.
+TELEMETRY_DATASOURCE: str = "tb_cli_telemetry"
+def get_ci_product_name() -> Optional[str]:
+    if _is_env_true("TB_DISABLE_CI_DETECTION"):
+        return None
+    CI_CHECKS: List[Tuple[str, Callable[[], bool]]] = [
+        ("Azure pipelines", lambda: _is_env_true("TF_BUILD")),
+        ("GitHub Actions", lambda: _is_env_true("GITHUB_ACTIONS")),
+        ("Appveyor", lambda: _is_env_true("APPVEYOR")),
+        ("Travis CI", lambda: _is_env_true("TRAVIS")),
+        ("Circle CI", lambda: _is_env_true("CIRCLECI")),
+        ("Amazon Web Services CodeBuild", lambda: _is_env_present(["CODEBUILD_BUILD_ID", "AWS_REGION"])),
+        ("Jenkins", lambda: _is_env_present(["BUILD_ID", "BUILD_URL"])),
+        ("Google Cloud Build", lambda: _is_env_present(["BUILD_ID", "PROJECT_ID"])),
+        ("TeamCity", lambda: _is_env_present(["TEAMCITY_VERSION"])),
+        ("JetBrains Space", lambda: _is_env_present(["JB_SPACE_API_URL"])),
+        ("Generic CI", lambda: _is_env_true("CI")),
+    ]
+    return next((check[0] for check in CI_CHECKS if check[1]()), None)
+def is_ci_environment() -> bool:
+    ci_product: Optional[str] = get_ci_product_name()
+    return ci_product is not None
+def silence_errors(f: Callable) -> Callable:
+    """Decorator to silence all errors in the decorated
+    function.
+    """
+    @functools.wraps(f)
+    def wrapper(*args, **kwargs) -> Any:
+        try:
+            return f(*args, **kwargs)
+        except Exception:
+            return None
+    return wrapper
+def _is_env_true(env_var: str) -> bool:
+    """Checks if `env_var` is `true` or `1`."""
+    return os.getenv(env_var, "").lower() in ("true", "1")
+def _is_env_present(envs: List[str]) -> bool:
+    """Checks if all of the variables passed in `envs`
+    are defined (ie: not empty)
+    """
+    return all(os.getenv(env_var, None) is not None for env_var in envs)
+def _hide_tokens(text: str) -> str:
+    """Cuts any token in a way that they get unusable if leaked,
+    but we still can use them for debugging if needed.
+    """
+    return re.sub(r"p\.ey[A-Za-z0-9-_\.]+", lambda s: f"{s[0][:10]}...{s[0][-10:]}", text)
+class TelemetryHelper:
+    def __init__(self, tb_host: Optional[str] = None, max_enqueued_events: int = 5) -> None:
+        self.tb_host = tb_host or os.getenv("TB_CLI_TELEMETRY_HOST", "https://api.tinybird.co")
+        self.max_enqueued_events: int = max_enqueued_events
+        self.enabled: bool = True
+        self.events: List[Dict[str, Any]] = []
+        self.telemetry_token: Optional[str] = None
+        run_id = str(uuid.uuid4())
+        self._defaults: Dict[str, Any] = {
+            # Per-event values
+            "event": "<the event>",
+            "event_data": "<the event data>",
+            "timestamp": "<the timestamp>",
+            # Static values
+            "run_id": run_id,
+        }
+        self._threads: List[threading.Thread] = []
+        self.log(f"Telemetry initialized with run_id: {run_id}")
+    @silence_errors
+    def add_event(self, event: str, event_data: Dict[str, Any]) -> None:
+        if not self.enabled:
+            self.log("Helper is disabled")
+            return
+        if "x.y.z" in CURRENT_VERSION and not _is_env_true("TB_CLI_TELEMETRY_SEND_IN_LOCAL"):
+            self.log("Not sending events in local development mode")
+            return
+        # Let's save deep copies to not interfere with original objects
+        event_dict: Dict[str, Any] = deepcopy(self._defaults)
+        event_dict["event"] = event
+        event_dict["event_data"] = json.dumps(event_data)
+        event_dict["timestamp"] = datetime.utcnow().isoformat()
+        self.events.append(event_dict)
+        if len(self.events) >= self.max_enqueued_events:
+            self.flush()
+    @silence_errors
+    def flush(self, wait: bool = False) -> None:
+        if self.enabled and len(self.events) > 0:
+            # Take the ownership for the pending events.
+            #
+            # We need this because the proper flush() is done in
+            # a thread to avoid blocking  the user and we could send
+            # the same event twice if we maintain the same list after
+            # during the sending.
+            events: List[Dict[str, Any]] = self.events
+            self.events = []
+            self.log(f"Flusing {len(events)} events in a new thread...")
+            thread: threading.Thread = threading.Thread(target=self._flush, args=[events])
+            self._threads.append(thread)
+            thread.start()
+        if wait:
+            for t in self._threads:
+                t.join()
+                if t.is_alive():
+                    self.log(f"Couldn't wait for the end of the thread {t.name}")
+            self._threads.clear()
+    @silence_errors
+    def _flush(self, events: List[Dict[str, Any]]) -> None:
+        """Actual flush. This is where we use HFI to ingest events."""
+        timeout: int
+        try:
+            timeout = int(os.getenv("TB_CLI_TELEMETRY_TIMEOUT", TELEMETRY_TIMEOUT))
+            timeout = max(TELEMETRY_TIMEOUT, timeout)
+        except ValueError:
+            timeout = TELEMETRY_TIMEOUT
+        if not self.telemetry_token:
+            self.telemetry_token = os.getenv("TB_CLI_TELEMETRY_TOKEN")
+            if self.telemetry_token:
+                self.log("Got telemetry token from environment TB_CLI_TELEMETRY_TOKEN")
+        with requests.Session() as session:
+            if not self.telemetry_token:
+                url: str = f"{self.tb_host}/v0/regions"
+                self.log(f"Requesting token from {url}...")
+                try:
+                    r = session.get(url, timeout=timeout)
+                    regions: List[Dict[str, Any]] = json.loads(r.content.decode())["regions"]
+                    self.telemetry_token = next(
+                        (r.get("telemetry_token", None) for r in regions if r["api_host"] == self.tb_host), None
+                    )
+                    if self.telemetry_token:
+                        self.log(f"Got telemetry token from {url}")
+                except requests.exceptions.Timeout:
+                    self.log(f"Disabling due to timeout after {timeout} seconds")
+                    self.enabled = False
+                    return
+                except Exception as ex:
+                    self.log(str(ex))
+            if not self.telemetry_token:
+                self.log("Disabling due to lack of token")
+                self.enabled = False
+                return
+            self.log(f"token={self.telemetry_token}")
+            data: str = _hide_tokens("\n".join(json.dumps(e) for e in events))
+            # Note we don't use `wait` as this telemetry isn't a critical
+            # operation to support and we don't want to generate overhead
+            params: Dict[str, Any] = {"name": TELEMETRY_DATASOURCE, "token": self.telemetry_token}
+            url = f"{self.tb_host}/v0/events?{urlencode(params)}"
+            try:
+                self.log(f"Sending data to {url}...")
+                r = session.post(url, data=data, timeout=timeout)
+            except requests.exceptions.Timeout:
+                self.log(f"Disabling due to timeout after {timeout} seconds")
+                self.enabled = False
+                return
+            self.log(f"Received status {r.status_code}: {r.text}")
+            if r.status_code == 200 or r.status_code == 202:
+                self.log(f"Successfully sent {len(events)} events to {self.tb_host}")
+                self.events.clear()
+                return
+            if r.status_code in (403, 404):
+                self.log(f"Disabling due to {r.status_code} errors")
+                self.enabled = False
+                return
+            if r.status_code >= 500:
+                self.log(f"Disabling telemetry and discarding {len(events)} events")
+                self.enabled = False
+    @silence_errors
+    def log(self, msg: str) -> None:
+        """Internal logging function to help with development and debugging."""
+        if not _is_env_true("TB_CLI_TELEMETRY_DEBUG"):
+            return
+        print(f"> Telemetry: {msg}")  # noqa: T201
+# Shared helper, created by `_get_helper()` the first time it is needed.
+_helper_instance: Optional[TelemetryHelper] = None
+@silence_errors
+def init_telemetry() -> None:
+    """Setups the telemetry helper with the config present in `config`.
+    If no config is provided, it tries to get it from the passed Click context.
+    We need to call this method any time we suspect the config changes any value.
+    """
+    telemetry = _get_helper()
+    if telemetry:
+        telemetry.log("Initialized")
+@silence_errors
+def add_telemetry_event(event: str, **kw_event_data: Any) -> None:
+    """Adds a new telemetry event."""
+    telemetry = _get_helper()
+    if not telemetry:
+        return
+    try:
+        telemetry.add_event(event, dict(**kw_event_data))
+    except Exception as ex:
+        telemetry.log(str(ex))
+@silence_errors
+def add_telemetry_sysinfo_event() -> None:
+    """Collects system info and sends a `system_info` event
+    with the data.
+    """
+    ci_product: Optional[str] = get_ci_product_name()
+    add_telemetry_event(
+        "system_info",
+        platform=platform.platform(),
+        system=platform.system(),
+        arch=platform.machine(),
+        processor=platform.processor(),
+        python_runtime=platform.python_implementation(),
+        python_version=platform.python_version(),
+        is_ci=ci_product is not None,
+        ci_product=ci_product,
+        cli_version=CURRENT_VERSION,
+        cli_args=sys.argv[1:] if len(sys.argv) > 1 else [],
+    )
+@silence_errors
+def flush_telemetry(wait: bool = False) -> None:
+    """Flushes all pending telemetry events."""
+    telemetry = _get_helper()
+    if not telemetry:
+        return
+    try:
+        telemetry.flush(wait=wait)
+    except Exception as ex:
+        telemetry.log(str(ex))
+@silence_errors
+def _get_helper() -> Optional[TelemetryHelper]:
+    """Returns the shared TelemetryHelper instance."""
+    if _is_env_true("TB_CLI_TELEMETRY_OPTOUT"):
+        return None
+    global _helper_instance
+    if not _helper_instance:
+        _helper_instance = TelemetryHelper()
+    return _helper_instance

tinybird/tb_cli_modules/test.py ADDED Viewed

@@ -0,0 +1,107 @@
+# This is a command file for our CLI. Please keep it clean.
+#
+# - If it makes sense and only when strictly necessary, you can create utility functions in this file.
+# - But please, **do not** interleave utility functions and command definitions.
+import glob
+from typing import Any, Dict, Iterable, List, Tuple
+import click
+from tinybird.client import AuthNoTokenException
+from tinybird.feedback_manager import FeedbackManager
+from tinybird.tb_cli_modules.cli import cli
+from tinybird.tb_cli_modules.common import coro, create_tb_client, gather_with_concurrency
+from tinybird.tb_cli_modules.config import CLIConfig
+from tinybird.tb_cli_modules.exceptions import CLIException
+from tinybird.tb_cli_modules.tinyunit.tinyunit import (
+    TestSummaryResults,
+    generate_file,
+    parse_file,
+    run_test_file,
+    test_run_summary,
+)
+@cli.group()
+@click.pass_context
+def test(ctx: click.Context) -> None:
+    """Test commands."""
+    # Group that holds the subcommands registered below with `@test.command`; it does no work itself.
+@test.command(
+    name="run",
+    help="Run the test suite, a file, or a test. To skip test to run in branches and CI put them in a 'skip_in_branch' folder.",
+)
+@click.argument("file", nargs=-1)
+@click.option("-v", "--verbose", is_flag=True, default=False, help="Enable verbose (show results)", type=bool)
+@click.option("--fail", "only_fail", is_flag=True, default=False, help="Showy onl failed/error tests", type=bool)
+@click.option("-c", "--concurrency", help="How many test to run concurrently", default=1, type=click.IntRange(1, 10))
+@click.pass_context
+@coro
+async def test_run(ctx: click.Context, file: Tuple[str, ...], verbose: bool, only_fail: bool, concurrency: int) -> None:
+    results: List[TestSummaryResults] = []
+    try:
+        tb_client = create_tb_client(ctx)
+        config = CLIConfig.get_project_config()
+        if config.get("token") is None:
+            raise AuthNoTokenException
+        workspaces: List[Dict[str, Any]] = (await tb_client.user_workspaces_and_branches()).get("workspaces", [])
+        current_ws: Dict[str, Any] = next(
+            (workspace for workspace in workspaces if config and workspace.get("id", ".") == config.get("id", "..")), {}
+        )
+    except Exception as e:
+        raise CLIException(FeedbackManager.error_exception(error=e))
+    file_list: Iterable[str] = file if len(file) > 0 else glob.glob("./tests/**/*.y*ml", recursive=True)
+    click.echo(FeedbackManager.info_skipping_resource(resource="regression.yaml"))
+    file_list = [f for f in file_list if not f.endswith("regression.yaml")]
+    final_file_list = []
+    for f in file_list:
+        if "skip_in_branch" in f and current_ws and current_ws.get("is_branch"):
+            click.echo(FeedbackManager.info_skipping_resource(resource=f))
+        else:
+            final_file_list.append(f)
+    file_list = final_file_list
+    async def run_test(tb_client, test_file, results):
+        try:
+            test_result = await run_test_file(tb_client, test_file)
+            results.append(TestSummaryResults(filename=test_file, results=test_result, semver=tb_client.semver))
+        except Exception as e:
+            if verbose:
+                click.echo(FeedbackManager.error_exception(error=e))
+            raise CLIException(FeedbackManager.error_running_test(file=test_file))
+    test_tasks = [run_test(tb_client, test_file, results) for test_file in file_list]
+    await gather_with_concurrency(concurrency, *test_tasks)
+    if len(results) <= 0:
+        click.echo(FeedbackManager.warning_no_test_results())
+    else:
+        test_run_summary(results, only_fail=only_fail, verbose_level=int(verbose))
+@test.command(name="init", help="Initialize a file list with a simple test suite.")
+@click.argument("files", nargs=-1)
+@click.option("--force", is_flag=True, default=False, help="Override existing files")
+@click.pass_context
+@coro
+async def test_init(ctx: click.Context, files: Tuple[str, ...], force: bool) -> None:
+    if len(files) == 0:
+        files = ("tests/default.yaml",)
+    for file in files:
+        generate_file(file, overwrite=force)
+@test.command(name="parse", help="Read the contents of a test file list.")
+@click.argument("files", nargs=-1)
+@click.pass_context
+@coro
+async def test_parse(ctx: click.Context, files: Tuple[str, ...]) -> None:
+    for f in files:
+        click.echo(f"\nFile: {f}")
+        for test in parse_file(f):
+            click.echo(test)