dvc-utils 0.0.5__py3-none-any.whl → 0.0.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
dvc_utils/main.py CHANGED
@@ -2,15 +2,12 @@ from functools import cache
2
2
  from os import environ as env, getcwd
3
3
  from os.path import join, relpath
4
4
  import shlex
5
- from subprocess import Popen, PIPE
6
5
  from typing import Optional, Tuple
7
6
 
8
7
  from click import option, argument, group
9
8
  import click
10
9
  import yaml
11
- from utz import process, singleton, err
12
-
13
- from dvc_utils.named_pipes import named_pipes
10
+ from utz import diff_cmds, process, err, singleton
14
11
 
15
12
 
16
13
  @group()
@@ -69,86 +66,6 @@ def dvc_cache_path(ref: str, dvc_path: Optional[str] = None, log: bool = False)
69
66
  return join(dvc_cache_dir(log=log), 'files', 'md5', dirname, basename)
70
67
 
71
68
 
72
- def diff_cmds(
73
- cmds1: list[str],
74
- cmds2: list[str],
75
- verbose: bool = False,
76
- color: bool = False,
77
- unified: int | None = None,
78
- ignore_whitespace: bool = False,
79
- **kwargs,
80
- ):
81
- """Run two sequences of piped commands and diff their output.
82
-
83
- Args:
84
- cmds1: First sequence of commands to pipe together
85
- cmds2: Second sequence of commands to pipe together
86
- verbose: Whether to print commands being executed
87
- color: Whether to show colored diff output
88
- unified: Number of unified context lines, or None
89
- ignore_whitespace: Whether to ignore whitespace changes
90
- **kwargs: Additional arguments passed to subprocess.Popen
91
-
92
- Each command sequence will be piped together before being compared.
93
- For example, if cmds1 = ['cat foo.txt', 'sort'], the function will
94
- execute 'cat foo.txt | sort' before comparing with cmds2's output.
95
-
96
- Adapted from https://stackoverflow.com/a/28840955"""
97
- with named_pipes(n=2) as pipes:
98
- (pipe1, pipe2) = pipes
99
- diff_cmd = [
100
- 'diff',
101
- *(['-w'] if ignore_whitespace else []),
102
- *(['-U', str(unified)] if unified is not None else []),
103
- *(['--color=always'] if color else []),
104
- pipe1,
105
- pipe2,
106
- ]
107
- diff = Popen(diff_cmd)
108
- processes = []
109
-
110
- for pipe, cmds in ((pipe1, cmds1), (pipe2, cmds2)):
111
- if verbose:
112
- err(f"Running pipeline: {' | '.join(cmds)}")
113
-
114
- # Create the pipeline of processes
115
- prev_process = None
116
- for i, cmd in enumerate(cmds):
117
- is_last = i + 1 == len(cmds)
118
-
119
- # For the first process, take input from the original source
120
- stdin = None if prev_process is None else prev_process.stdout
121
-
122
- # For the last process, output to the named pipe
123
- if is_last:
124
- with open(pipe, 'wb', 0) as pipe_fd:
125
- proc = Popen(
126
- cmd,
127
- stdin=stdin,
128
- stdout=pipe_fd,
129
- close_fds=True,
130
- **kwargs
131
- )
132
- # For intermediate processes, output to a pipe
133
- else:
134
- proc = Popen(
135
- cmd,
136
- stdin=stdin,
137
- stdout=PIPE,
138
- close_fds=True,
139
- **kwargs
140
- )
141
-
142
- if prev_process is not None:
143
- prev_process.stdout.close()
144
-
145
- processes.append(proc)
146
- prev_process = proc
147
-
148
- for p in [diff] + processes:
149
- p.wait()
150
-
151
-
152
69
  @cli.command('diff', short_help='Diff a DVC-tracked file at two commits (or one commit vs. current worktree), optionally passing both through another command first')
153
70
  @option('-c', '--color', is_flag=True, help='Colorize the output')
154
71
  @option('-r', '--refspec', default='HEAD', help='<commit 1>..<commit 2> (compare two commits) or <commit> (compare <commit> to the worktree)')
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: dvc-utils
3
- Version: 0.0.5
3
+ Version: 0.0.7
4
4
  Summary: CLI for diffing DVC files at two commits (or one commit vs. current worktree), optionally passing both through another command first
5
5
  Home-page: https://github.com/runsascoded/dvc-utils
6
6
  Author: Ryan Williams
@@ -15,7 +15,7 @@ CLI for diffing [DVC] files, optionally passing both through another command fir
15
15
  <!-- toc -->
16
16
  - [Installation](#installation)
17
17
  - [Usage](#usage)
18
- - [`dvc-utils diff`](#dvc-utils-diff)
18
+ - [`dvc-diff`](#dvc-diff)
19
19
  - [Examples](#examples)
20
20
  - [Parquet file](#parquet-diff)
21
21
  - [Schema diff](#parquet-schema-diff)
@@ -42,11 +42,13 @@ dvc-utils --help
42
42
  # worktree), optionally passing both through another command first
43
43
  ```
44
44
 
45
- ### `dvc-utils diff` <a id="dvc-utils-diff"></a>
46
- <!-- `bmdf -- dvc-utils diff --help` -->
45
+ The single subcommand, `dvc-utils diff`, is also exposed directly as `dvc-diff`:
46
+
47
+ ### `dvc-diff` <a id="dvc-diff"></a>
48
+ <!-- `bmdf -- dvc-diff --help` -->
47
49
  ```bash
48
- dvc-utils diff --help
49
- # Usage: dvc-utils diff [OPTIONS] [cmd...] <path>
50
+ dvc-diff --help
51
+ # Usage: dvc-diff [OPTIONS] [exec_cmd...] <path>
50
52
  #
51
53
  # Diff a file at two commits (or one commit vs. current worktree), optionally
52
54
  # passing both through `cmd` first
@@ -69,6 +71,8 @@ dvc-utils diff --help
69
71
  # to `diff`)
70
72
  # -v, --verbose Log intermediate commands to stderr
71
73
  # -w, --ignore-whitespace Ignore whitespace differences (pass `-w` to `diff`)
74
+ # -x, --exec-cmd TEXT Command(s) to execute before diffing; alternate
75
+ # syntax to passing commands as positional arguments
72
76
  # --help Show this message and exit.
73
77
  ```
74
78
 
@@ -91,7 +95,7 @@ parquet_schema() {
91
95
  parquet2json "$1" schema
92
96
  }
93
97
  export -f parquet_schema
94
- dvc-utils diff -r $commit^..$commit parquet_schema $path
98
+ dvc-diff -r $commit^..$commit parquet_schema $path
95
99
  ```
96
100
  <details><summary>Output</summary>
97
101
 
@@ -149,7 +153,7 @@ pretty_print_first_row() {
149
153
  parquet2json "$1" cat -l 1 | jq .
150
154
  }
151
155
  export -f pretty_print_first_row
152
- dvc-utils diff -r $commit^..$commit pretty_print_first_row $path
156
+ dvc-diff -r $commit^..$commit pretty_print_first_row $path
153
157
  ```
154
158
 
155
159
  <details><summary>Output</summary>
@@ -208,7 +212,7 @@ parquet_row_count() {
208
212
  parquet2json "$1" rowcount
209
213
  }
210
214
  export -f parquet_row_count
211
- dvc-utils diff -r $commit^..$commit parquet_row_count $path
215
+ dvc-diff -r $commit^..$commit parquet_row_count $path
212
216
  ```
213
217
 
214
218
  This time we get no output; [the given `$commit`][commit] didn't change the row count in the DVC-tracked Parquet file [`$path`][commit path].
@@ -0,0 +1,8 @@
1
+ dvc_utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
2
+ dvc_utils/main.py,sha256=1eiIL96OPY-dP12cNzHHDFB5KyGI2baauZgeDDjyxHs,5002
3
+ dvc_utils-0.0.7.dist-info/LICENSE,sha256=ZS8AReay7xmQzBAHwxIuTouGXz3SKgUa2_Sz8Ip0EzQ,1070
4
+ dvc_utils-0.0.7.dist-info/METADATA,sha256=kqz3QZm4TZOjhr2GsHjJPyfx0n0HBshk-O8fm3fjzs0,7107
5
+ dvc_utils-0.0.7.dist-info/WHEEL,sha256=bFJAMchF8aTQGUgMZzHJyDDMPTO3ToJ7x23SLJa1SVo,92
6
+ dvc_utils-0.0.7.dist-info/entry_points.txt,sha256=0JqFeb29N5ZrvwmIJrg4ii32xNFOXRul-HMq-3GOIw4,90
7
+ dvc_utils-0.0.7.dist-info/top_level.txt,sha256=jT0-PJa2t_eFRE9rn-52AjdnZ8nQeEHllf2kJmaGh80,10
8
+ dvc_utils-0.0.7.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: bdist_wheel (0.44.0)
2
+ Generator: bdist_wheel (0.45.0)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5
 
@@ -1,2 +1,3 @@
1
1
  [console_scripts]
2
+ dvc-diff = dvc_utils.main:dvc_utils_diff
2
3
  dvc-utils = dvc_utils.main:cli
dvc_utils/named_pipes.py DELETED
@@ -1,19 +0,0 @@
1
- import os
2
- import shutil
3
- import tempfile
4
- from contextlib import contextmanager
5
-
6
-
7
- @contextmanager
8
- def named_pipes(n: int = 1):
9
- """Yield a list of paths to named pipes that are created and destroyed
10
-
11
- From https://stackoverflow.com/a/28840955"""
12
- dirname = tempfile.mkdtemp()
13
- try:
14
- paths = [os.path.join(dirname, 'named_pipe' + str(i)) for i in range(n)]
15
- for path in paths:
16
- os.mkfifo(path)
17
- yield paths
18
- finally:
19
- shutil.rmtree(dirname)
@@ -1,9 +0,0 @@
1
- dvc_utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
2
- dvc_utils/main.py,sha256=UhCm28Zu_xwsmfzOKgmAYJrCrfumryid_10F_-Rg-2M,7850
3
- dvc_utils/named_pipes.py,sha256=VQ2t9BYCazFq_-MABj4t2HS7GHDvSqXXx8fOLz5DsTc,492
4
- dvc_utils-0.0.5.dist-info/LICENSE,sha256=ZS8AReay7xmQzBAHwxIuTouGXz3SKgUa2_Sz8Ip0EzQ,1070
5
- dvc_utils-0.0.5.dist-info/METADATA,sha256=y46AoDbejlmv318zUD4aKiY9SprlRh9hdCBcoGZ4H4M,6924
6
- dvc_utils-0.0.5.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
7
- dvc_utils-0.0.5.dist-info/entry_points.txt,sha256=W9OuZ6CX8QF9ojbqLtfXFo8Q2hnJ-zlcGY4_7nO8paM,49
8
- dvc_utils-0.0.5.dist-info/top_level.txt,sha256=jT0-PJa2t_eFRE9rn-52AjdnZ8nQeEHllf2kJmaGh80,10
9
- dvc_utils-0.0.5.dist-info/RECORD,,