PyPI - visidata - Versions diffs - 3.1.1__py3-none-any.whl → 3.3__py3-none-any.whl - Mend

visidata 3.1.1py3-none-any.whl → 3.3py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (99) hide show

visidata/__init__.py +2 -2
visidata/_input.py +106 -58
visidata/_open.py +10 -7
visidata/_types.py +2 -2
visidata/aggregators.py +125 -16
visidata/apps/vdsql/_ibis.py +8 -13
visidata/basesheet.py +4 -3
visidata/canvas.py +11 -7
visidata/clipboard.py +11 -2
visidata/cliptext.py +68 -23
visidata/cmdlog.py +5 -1
visidata/column.py +48 -33
visidata/ddwplay.py +2 -2
visidata/deprecated.py +96 -63
visidata/errors.py +41 -5
visidata/{features → experimental}/helloworld.py +1 -1
visidata/experimental/liveupdate.py +1 -1
visidata/expr.py +1 -0
visidata/extensible.py +4 -0
visidata/features/cmdpalette.py +64 -25
visidata/features/describe.py +2 -2
visidata/features/expand_cols.py +7 -5
visidata/features/freeze.py +14 -2
visidata/features/go_col.py +3 -3
visidata/features/graph_zoom_y.py +47 -0
visidata/features/incr.py +7 -3
visidata/features/join.py +23 -12
visidata/features/layout.py +8 -4
visidata/features/melt.py +1 -0
visidata/features/rank.py +103 -0
visidata/features/reload_every.py +11 -8
visidata/features/sysedit.py +14 -4
visidata/features/transpose.py +1 -0
visidata/features/window.py +12 -0
visidata/form.py +10 -9
visidata/freqtbl.py +47 -3
visidata/fuzzymatch.py +11 -7
visidata/graph.py +5 -3
visidata/guides/AggregatorsSheet.md +84 -0
visidata/guides/CommandsSheet.md +1 -0
visidata/guides/MacrosSheet.md +1 -1
visidata/guides/RankGuide.md +51 -0
visidata/guides/TypesSheet.md +1 -1
visidata/guides/WindowFunctionGuide.md +49 -0
visidata/help.py +23 -6
visidata/indexsheet.py +1 -1
visidata/loaders/_pandas.py +3 -1
visidata/loaders/archive.py +33 -6
visidata/loaders/csv.py +12 -1
visidata/loaders/eml.py +2 -0
visidata/loaders/f5log.py +2 -2
visidata/loaders/fec.py +6 -9
visidata/loaders/fixed_width.py +2 -0
visidata/loaders/hdf5.py +34 -10
visidata/loaders/npy.py +54 -23
visidata/loaders/orgmode.py +3 -2
visidata/loaders/pandas_freqtbl.py +4 -0
visidata/loaders/psv.py +13 -0
visidata/loaders/sqlite.py +1 -1
visidata/loaders/vds.py +3 -4
visidata/macros.py +5 -4
visidata/main.py +21 -11
visidata/mainloop.py +8 -5
visidata/man/parse_options.py +3 -2
visidata/man/vd.1 +38 -17
visidata/man/vd.txt +47 -17
visidata/menu.py +10 -10
visidata/metasheets.py +3 -3
visidata/mouse.py +3 -0
visidata/movement.py +6 -3
visidata/pyobj.py +17 -9
visidata/save.py +10 -2
visidata/selection.py +29 -18
visidata/settings.py +9 -5
visidata/sheets.py +124 -48
visidata/shell.py +2 -2
visidata/sidebar.py +11 -8
visidata/sort.py +89 -11
visidata/statusbar.py +10 -9
visidata/tests/test_cliptext.py +164 -0
visidata/tests/test_commands.py +6 -2
visidata/tests/test_menu.py +1 -1
visidata/textsheet.py +34 -8
visidata/themes/ascii8.py +2 -2
visidata/themes/light.py +5 -0
visidata/threads.py +38 -8
visidata/utils.py +15 -1
visidata/vendor/__init__.py +0 -0
{visidata-3.1.1.data → visidata-3.3.data}/data/share/man/man1/vd.1 +38 -17
{visidata-3.1.1.data → visidata-3.3.data}/data/share/man/man1/visidata.1 +38 -17
{visidata-3.1.1.dist-info → visidata-3.3.dist-info}/METADATA +62 -15
{visidata-3.1.1.dist-info → visidata-3.3.dist-info}/RECORD +98 -92
{visidata-3.1.1.dist-info → visidata-3.3.dist-info}/WHEEL +1 -1
{visidata-3.1.1.dist-info → visidata-3.3.dist-info}/entry_points.txt +1 -0
visidata-3.1.1.data/scripts/vd +0 -6
{visidata-3.1.1.data → visidata-3.3.data}/data/share/applications/visidata.desktop +0 -0
{visidata-3.1.1.data → visidata-3.3.data}/scripts/vd2to3.vdx +0 -0
{visidata-3.1.1.dist-info → visidata-3.3.dist-info}/LICENSE.gpl3 +0 -0
{visidata-3.1.1.dist-info → visidata-3.3.dist-info}/top_level.txt +0 -0

visidata/guides/AggregatorsSheet.md ADDED Viewed

@@ -0,0 +1,84 @@
+---
+sheet: AggregatorSheet
+---
+# Aggregations like sum, mean, and distinct
+Aggregators provide summary statistics for grouped rows.
+The current aggregators include:
+   min           smallest value in the group
+   max           largest value in the group
+   avg/mean      average value of the group
+   mode          most frequently appearing value in group
+   median        median value in the group
+   q3/q4/q5/q10  add quantile aggregators to group (e.g. q4 adds p25, p50, p75)
+   sum           total summation of all numbers in the group
+   distinct      number of distinct values in the group
+   count         number of values in the group
+   keymax        key of the row with the largest value in the group
+   list          gathers values in column into a list
+   stdev         standard deviation of values
+## View a one-off aggregation of a column
+- {help.commands.memo-aggregate}
+## Create an aggregator column
+Aggregated columns appear in the **Frequency Table** and **Pivot Table** (grouped sheets).  Aggregated values will also appear at the bottom of their columns in the source sheet.
+- {help.commands.aggregate-col}
+Then aggregate the sheet with one of the grouping commands:
+- {help.commands.freq-col}
+- {help.commands.pivot}
+Aggregators can be viewed and modified on the **Columns Sheet** in the `aggregators` column.
+- {help.commands.columns-sheet}
+## The Describe Sheet
+To get a predefined set of summary statistics for every column in the sheet, use the **Describe Sheet**:
+- {help.commands.describe-all}
+## Examples
+Sample input sheet **sales**:
+   date        color  price
+   ----------  -----  -----
+   2024-09-01  R      30
+   2024-09-02  B      28
+   2024-09-03  R      100
+   2024-09-03  B      33
+   2024-09-03  B      99
+1. Move to the `price` column
+2. Set it to currency: [:keys]$[/]
+3. Quickly show average price
+    - [:keys]z+[/] (`memo-aggregate`) then enter 'avg'
+4. Add a `sum` aggregator column:
+    - Press [:keys]+[/] (`aggregate-col`) then enter 'sum'
+5. Move to the date column [:keys]gh[/]
+6. Generate a **Frequency Table** by `date`
+    - [:keys]Shift-F[/] (`freq-col`)
+   date        count  price_sum
+   ----------  -----  ---------
+   2024-09-03  3      232.00
+   2024-09-01  1      30.00
+   2024-09-02  1      28.00
+## Creating new aggregator functions
+To add a new aggregator to compute the range of the grouped values (max - min), add the following to `.visidatarc`:
+[:code]vd.aggregator('range', lambda values: max(values) - min(values), 'range of values')[/]
+The `values` parameter is a list of typed values from the column, with the function returning the aggregated value.
+The new aggregator will now be available the next time VisiData is started.

visidata/guides/CommandsSheet.md CHANGED Viewed

@@ -8,6 +8,7 @@ Start typing a command longname or keyword in its helpstring.
 - [:code]Enter[/] to execute top command.
 - [:code]Tab[/] to highlight top command and provide a numeric jumplist.
+- [:code]PgUp[/]/[:code]PgDn[/] to scroll through commands.
 When a command is highlighted:

visidata/guides/MacrosSheet.md CHANGED Viewed

@@ -6,7 +6,7 @@ The basic usage is:
     2. Execute a series of commands.
     3. `m` again to complete the recording, and prompt for the keystroke or longname to bind it to.
-The macro will then be executed everytime the provided keystroke or longname are used. Note: the Alt+keys and the function keys are left unbound; overriding other keys may conflict with existing bindings, now or in the future.
+The macro will then be executed every time the provided keystroke or longname are used. Note: the Alt+keys and the function keys are left unbound; overriding other keys may conflict with existing bindings, now or in the future.
 Executing a macro will run the series of commands starting on the current row and column on the current sheet.

visidata/guides/RankGuide.md ADDED Viewed

@@ -0,0 +1,51 @@
+# Ranking
+Ranking assigns numeric ranks to rows based on column values. VisiData provides two ranking approaches: sheet-wide ranking and group-based ranking.
+## Sheet-wide ranking
+[:keys]addcol-sheetrank[/] ranks all rows across the entire sheet.
+Navigate to the column to rank by and execute [:keys]addcol-sheetrank[/]. A new column appears with ranks, where 1 indicates the best value.
+**Example:**
+```
+Name   | Salary | Salary_rank
+Alice  | 95000  | 1
+Bob    | 85000  | 2
+Carol  | 70000  | 3
+```
+## Group-based ranking
+[:keys]addcol-aggregate[/] with [:code]rank[/] aggregator ranks rows within groups defined by key columns.
+1. Set key columns with [:keys]![/] (defines groups)
+2. Navigate to the column to rank by
+3. Execute [:keys]addcol-aggregate[/]
+4. Select [:code]rank[/] aggregator
+**Example with Department as key column:**
+```
+Name   | Department  | Salary | Salary_rank
+Alice  | Engineering | 95000  | 1
+Bob    | Engineering | 85000  | 2
+Carol  | Sales       | 70000  | 1
+Dave   | Sales       | 65000  | 2
+```
+Alice and Carol both receive rank 1 as the highest earners in their respective departments.
+## Sort direction
+Ranking follows the current sort direction of the column:
+- Ascending sort: lower values get better ranks
+- Descending sort: higher values get better ranks
+## Usage patterns
+**Global comparison:** Use [:keys]addcol-sheetrank[/] to find overall leaders across all data.
+**Category comparison:** Use [:keys]addcol-aggregate[/] + [:code]rank[/] to find leaders within each group defined by key columns.
+**Multiple groupings:** Set multiple key columns before group ranking for complex categorization.

visidata/guides/TypesSheet.md CHANGED Viewed

@@ -17,7 +17,7 @@ VisiData pre-set defaults for formatting types:
 - `currency` removes non-numeric characters and parses the remainder as `float`.
 - `date` parses dates into date object (shown as ISO8601).
 - `vlen` formats the cell value to the length of the content
-- `float` uses the decimal seperator, keeping two significant digits.
+- `float` uses the decimal separator, keeping two significant digits.
 Change float precision with:
 - {help.commands.setcol-precision-less}

visidata/guides/WindowFunctionGuide.md ADDED Viewed

@@ -0,0 +1,49 @@
+---
+sheet: Sheet
+---
+# Create a window over consecutive rows
+Window functions enable computations that relate the current row to surrounding rows, like cumulative sums, rolling averages, or lead/lag computations.
+{help.commands.addcol-window}
+With large window sizes, use [:code]g'[/] (`freeze-sheet`) to calculate all cells and copy the entire sheet into a new source sheet, which will conserve CPU.
+## Examples
+   date        color  price
+   ----------  -----  -----
+   2024-09-01  R      30
+   2024-09-02  B      28
+   2024-09-03  R      100
+   2024-09-03  B      33
+   2024-09-03  B      99
+1. [:keys]#[/] (`type-int`) on the **price** column to type as int.
+2. [:keys]w[/] (`addcol-window`) on the **price** column, followed by `1 2`, to create a window consisting of 4 rows: 1 row before the current row, and 2 rows after.
+3. To create a moving average of the values in the window, add a new column with a python expression: [:keys]=[/] (`addcol-expr`)
+followed by `sum(price_window)/len(price_window)`
+date            color   price   price_window            sum(price_window)/len(price_window)
+----------      -----   -----   -------------------     -----------------------------------
+2024-09-01      R       30      [4] ; 30; 28; 100       39.5
+2024-09-02      B       28      [4] 30; 28; 100; 33     47.75
+2024-09-03      R       100     [4] 28; 100; 33; 99     65.0
+2024-09-03      B       33      [4] 100; 33; 99;        58.0
+2024-09-03      B       99      [4] 33; 99; ;           33.0
+## Workflows
+### Create a cumulative sum
+1. Set the before window size to the total number of rows in the table, and the after rows to 0. In the above example that would be `w 5 0` (`addcol-window`).
+2. Add an expression ([:keys]=[/], `addcol-expr`) of `sum(window)` where `window` is the name of the window function column.
+### Compute the change between rows
+1. `w 1 0` on the `foo` column to create a window function of size 1 before and 0 after.
+2. Add a python expression. The window function column is 'foo_window':
+    `=foo_window[1] - foo_window[0] if len(foo_window) > 1 else None`

visidata/help.py CHANGED Viewed

@@ -4,7 +4,24 @@ import collections
 from visidata import VisiData, MetaSheet, ColumnAttr, Column, BaseSheet, VisiDataMetaSheet, SuspendCurses
 from visidata import vd, asyncthread, ENTER, drawcache, AttrDict, TextSheet
-vd.option('disp_expert', 0, 'max level of options and columns to include')
+vd.option('disp_help_flags', 'cmdpalette guides help hints inputfield inputkeys nometacols sidebar',
+    '''list of helper features to enable (space-separated):
+    - "cmdpalette": exec-longname suggestions
+    - "guides": guides in sidebar
+    - "help": help sidebar collapsed by default
+    - "hints": context-sensitive hints on menu line
+    - "inputfield": context-sensitive help for each input field
+    - "inputkeys": input quick reference in sidebar
+    - "nometacols": hide expert columns on metasheets
+    - "sidebar": context-sensitive sheet help in sidebar
+    - "all": enable all helper features''')
+@VisiData.api
+def wantsHelp(vd, feat):
+    return feat in vd.options.disp_help_flags or 'all' in vd.options.disp_help_flags
 @BaseSheet.api
 def hint_basichelp(sheet):
@@ -99,12 +116,13 @@ class HelpPane:
     def draw(self, scr, x=None, y=None, **kwargs):
         if not scr: return
-#        if vd.options.disp_help <= 0:
+#        if not vd.wantsHelp('statushelp'):
 #            if self.scr:
 #                self.scr.erase()
 #                self.scr.refresh()
 #                self.scr = None
 #            return
         if y is None: y=0  # show at top of screen by default
         if x is None: x=0
         hneeded = self.amgr.maxHeight+3
@@ -135,7 +153,7 @@ class HelpPane:
         self.scr.erase()
         self.scr.box()
         self.amgr.draw(self.scr, y=1, x=2, **kwargs)
-        self.scr.refresh()
+        self.scr.noutrefresh()
 @VisiData.api
@@ -176,13 +194,12 @@ BaseSheet.bindkey('gKEY_BACKSPACE', 'sysopen-help')
 HelpSheet.addCommand(None, 'exec-command', 'quit(sheet); draw_all(); activeStack[0].execCommand(cursorRow.longname)', 'execute command on undersheet')
 BaseSheet.addCommand(None, 'open-tutorial-visidata', 'launchBrowser("https://jsvine.github.io/intro-to-visidata/")', 'open https://jsvine.github.io/intro-to-visidata/')
-vd.addMenuItem("Help", "VisiData tutorial", 'open-tutorial-visidata')
-vd.addMenuItem("Help", 'Sheet commands', 'help-commands')
-vd.addMenuItem("Help", 'All commands', 'help-commands-all')
 vd.addGlobals(HelpSheet=HelpSheet)
 vd.addMenuItems('''
+    Help > VisiData tutorial > open-tutorial-visidata
+    Help > All commands > help-commands-all
     Help > Quick reference > sysopen-help
     Help > Command list > help-commands
 ''')

visidata/indexsheet.py CHANGED Viewed

@@ -99,7 +99,7 @@ BaseSheet.addCommand('g<', 'open-source-prev', 'vd.replace(openSource(source.nex
 IndexSheet.addCommand('g^R', 'reload-selected', 'reloadSheets(selectedRows or rows)', 'reload all selected sheets')
 # when diving into a sheet, remove the index unless it is precious
-SheetsSheet.addCommand('gC', 'columns-selected', 'vd.push(ColumnsSheet("all_columns", source=selectedRows))', 'open Columns Sheet with all visible columns from selected sheets')
+IndexSheet.addCommand('gC', 'columns-selected', 'vd.push(ColumnsSheet("all_columns", source=selectedRows))', 'open Columns Sheet with all visible columns from selected sheets')
 IndexSheet.addCommand('^C', 'cancel-row', 'cancelThread(*cursorRow.currentThreads)', 'abort async thread for current sheet')
 IndexSheet.addCommand('gz^C', 'cancel-rows', 'for vs in selectedRows: cancelThread(*vs.currentThreads)', 'abort async threads for selected sheets')
 SheetsSheet.addCommand('Enter', 'open-row', 'dest=cursorRow; vd.sheets.remove(sheet) if not sheet.precious else None; vd.push(openRow(dest))', 'open sheet referenced in current row')

visidata/loaders/_pandas.py CHANGED Viewed

@@ -28,7 +28,7 @@ def save_dta(vd, p, *sheets):
     vs = sheets[0]
     columns = [col.name for col in vs.visibleCols]
     # Get data types
     types = list()
     dispvals = next(vs.iterdispvals(format=True))
@@ -154,6 +154,8 @@ class PandasSheet(Sheet):
                 readfunc = self.read_tsv
             elif filetype == 'jsonl':
                 readfunc = partial(pd.read_json, lines=True)
+            elif filetype == 'hdf5':
+                readfunc = partial(pd.read_hdf, lines=True)
             else:
                 readfunc = getattr(pd, 'read_'+filetype) or vd.error('no pandas.read_'+filetype)
             # readfunc() handles binary and text open()

visidata/loaders/archive.py CHANGED Viewed

@@ -2,21 +2,25 @@ import pathlib
 import tarfile
 import zipfile
 import datetime
+import os.path
 from visidata.loaders import unzip_http
 from visidata import vd, VisiData, asyncthread, Sheet, Progress, Menu, options
-from visidata import ColumnAttr, Column, Path
+from visidata import ColumnAttr, Column, Path, filesize
 from visidata.type_date import date
 @VisiData.api
 def guess_zip(vd, p):
     if not p.is_url() and zipfile.is_zipfile(p.open_bytes()):
-        return dict(filetype='zip')
+        return dict(filetype='zip', _likelihood=10)
 @VisiData.api
 def guess_tar(vd, p):
+    # an empty file will pass is_tarfile(), but can't be opened by tarfile.open()
+    if filesize(p) == 0:
+        return None
     if tarfile.is_tarfile(p.open_bytes()):
-        return dict(filetype='tar')
+        return dict(filetype='tar', _likelihood=10)
 @VisiData.api
 def open_zip(vd, p):
@@ -81,13 +85,13 @@ Commands:
             return vd.openSource(Path(fi.filename, fp=fp, filesize=fi.file_size), filetype=options.filetype)
     def extract(self, *rows, path=None):
-        path = path or pathlib.Path('.')
+        path = path or Path('.')
         files = []
         for row in rows:
             r, _ = row
             vd.confirmOverwrite(path/r.filename)  #1452
-            self.extract_async(row)
+            self.extract_async(row, path=path)
     def sysopen_row(self, row):
         'Extract file in row to tempdir and launch $EDITOR.  Modifications will be discarded.'
@@ -109,6 +113,12 @@ Commands:
             if '://' in str(self.source):
                 unzip_http.warning = vd.warning
                 self._zfp = unzip_http.RemoteZipFile(str(self.source))
+            elif isinstance(self.source, Path):
+                if self.source.has_fp():  #when opening a zip inside tar or zip
+                    fp = self.source.open('rb')
+                else:
+                    fp = self.source
+                self._zfp = zipfile.ZipFile(fp, 'r')
             else:
                 self._zfp = zipfile.ZipFile(str(self.source), 'r')
@@ -119,18 +129,35 @@ Commands:
             yield [zi, Path(zi.filename)]
+#from https://docs.python.org/3/library/tarfile.html#tarfile.REGTYPE
+tarfile_type_names = {
+    tarfile.REGTYPE:"file",
+    tarfile.AREGTYPE:"file",
+    tarfile.LNKTYPE:"hard link",
+    tarfile.SYMTYPE:"symbolic link",
+    tarfile.CHRTYPE:"character device",
+    tarfile.BLKTYPE:"block device",
+    tarfile.DIRTYPE:"directory",
+    tarfile.FIFOTYPE:"FIFO",
+    tarfile.CONTTYPE:"contiguous file",
+    tarfile.GNUTYPE_LONGNAME:"GNU tar longname",
+    tarfile.GNUTYPE_LONGLINK:"GNU tar longlink",
+    tarfile.GNUTYPE_SPARSE:"GNU tar sparse file",
+}
 class TarSheet(Sheet):
     'Wrapper for `tarfile` library.'
     rowtype = 'files' # rowdef TarInfo
     columns = [
         ColumnAttr('name'),
+        Column('ext', getter=lambda col,row: row.isdir() and '/' or os.path.splitext(row.name)[1][1:]),
         ColumnAttr('size', type=int),
         ColumnAttr('mtime', type=date),
-        ColumnAttr('type', type=int),
+        Column('type', getter=lambda col, row: tarfile_type_names.get(row.type, 'unknown')),
         ColumnAttr('mode', type=int),
         ColumnAttr('uname'),
         ColumnAttr('gname')
     ]
+    nKeys=1
     def openRow(self, fi):
             tfp = tarfile.open(name=str(self.source))

visidata/loaders/csv.py CHANGED Viewed

@@ -12,6 +12,13 @@ vd.option('csv_lineterminator', '\r\n', 'lineterminator passed to csv.writer', r
 vd.option('safety_first', False, 'sanitize input/output to handle edge cases, with a performance cost', replay=True)
+@VisiData.api
+def guess_csv_delimiter(vd, p):
+    'If csv_delimiter option has been modified from default, assume CSV format.'
+    if vd.options.csv_delimiter != vd.options.getdefault('csv_delimiter'):
+        return dict(filetype='csv', _likelihood=2)
 @VisiData.api
 def guess_csv(vd, p):
     import csv
@@ -26,7 +33,11 @@ def guess_csv(vd, p):
         for csvopt in dir(dialect):
             if not csvopt.startswith('_'):
-                r['csv_'+csvopt] = getattr(dialect, csvopt)
+                v = getattr(dialect, csvopt)
+                optname = 'csv_'+csvopt
+                r[optname] = v
+                if vd.options.get(optname) != v:
+                    vd.warning(f'guessed option {optname}={v}')
         return r

visidata/loaders/eml.py CHANGED Viewed

@@ -6,6 +6,8 @@ from visidata import VisiData, vd, Column, TableSheet, vlen
 def open_eml(vd, p):
     return EmailSheet(p.base_stem, source=p)
+open_mhtml = open_eml
 class EmailSheet(TableSheet):
     rowtype = 'parts'  # rowdef: sub-Messages
     columns = [

visidata/loaders/f5log.py CHANGED Viewed

@@ -14,7 +14,7 @@ Regex: (?:/Common/)(?P<site>[^-]+)-(?P<vstype>[^-]+)-(?P<application>[^-]+)
 /Common/newyork-www-banking1
-... | site    | vstype | appliction | ...
+... | site    | vstype | application | ...
 ... | newyork | www    | banking1   | ...
 Adding to .visidatarc
@@ -313,7 +313,7 @@ class F5LogSheet(Sheet):
             cmd_data = msg[cmd_data_loc + 1 :]
             # split the message and the command
             msg, cmd = msg[:cmd_data_loc].rsplit(" ", maxsplit=1)
-            # strip off the trailling " -" from the message
+            # strip off the trailing " -" from the message
             msg = msg[:-2]
             object = cmd_data.split('"', maxsplit=2)
             if len(object) == 3:

visidata/loaders/fec.py CHANGED Viewed

@@ -106,22 +106,19 @@ class DiveSheet(Sheet):
                     self.addRow(item)
                 except Exception as e:
-                    vd.warning("Can't dive on lists with heterogenous item types.")
+                    vd.warning("Can't dive on lists with heterogeneous item types.")
                     return False
     def openRow(self, row):
         if self.is_keyvalue:
             cell = row["value"]
-            name = vd.joinSheetnames(self.name, row["key"])
             if isinstance(cell, (list, dict)):
-                vs = self.__class__(name, source = cell)
+                vs = self.__class__(self.name, row["key"], source = cell)
             else:
                 vd.warning("Nothing to dive into.")
                 return
         else:
-            name = vd.joinSheetnames(self.name, "row")
-            vs = self.__class__(name, source = self.row)
+            vs = self.__class__(self.name, "row", source = self.row)
         success = vs.reload()
         if success == False:
@@ -174,7 +171,7 @@ class FECScheduleSheet(Sheet):
         for schedule_name in self.source.keys():
             vs = FECItemizationSheet(
-                vd.joinSheetnames(self.name, schedule_name),
+                self.name, schedule_name,
                 schedule_name = schedule_name,
                 source = self.source[schedule_name],
                 size = len(self.source[schedule_name]),
@@ -225,7 +222,7 @@ class FECFiling(Sheet):
                 ] else dict
             vs = cls(
-                vd.joinSheetnames(self.name, component_name),
+                self.name, component_name,
                 component_name = component_name,
                 source = source_cls(),
                 size = 0,
@@ -270,7 +267,7 @@ class FECFiling(Sheet):
                 if form_type not in sheet_row.source:
                     sheet_row.source[form_type] = [ ]
                     subsheet = FECItemizationSheet(
-                        vd.joinSheetnames(sheet_row.name, form_type),
+                        sheet_row.name, form_type,
                         schedule_name = form_type,
                         source = [ ],
                         size = 0,

visidata/loaders/fixed_width.py CHANGED Viewed

@@ -110,3 +110,5 @@ def save_fixed(vd, p, *vsheets):
                     for col, val in dispvals.items():
                         fp.write(('{0:%s%s.%s} ' % ('>' if vd.isNumeric(col) else '<', widths[col], widths[col])).format(val))
                     fp.write('\n')
+FixedWidthColumnsSheet.options.null_value = ''    # the file format cannot contain None, so use empty string instead

visidata/loaders/hdf5.py CHANGED Viewed

@@ -1,4 +1,5 @@
-from visidata import VisiData, vd, Sheet, Path, Column, ItemColumn, BaseSheet
+from visidata import VisiData, vd, Sheet, Path, Column, ItemColumn, BaseSheet, anytype
+from itertools import chain
 @VisiData.api
 def open_h5(vd, p):
@@ -6,8 +7,11 @@ def open_h5(vd, p):
 VisiData.open_hdf5 = VisiData.open_h5
+vd.option('hdf5_matrix_enumerate', False, 'enumerate matrix rows and columns')
 class Hdf5ObjSheet(Sheet):
     'Support sheets in HDF5 format.'
     def iterload(self):
         h5py = vd.importExternal('h5py')
         source = self.source
@@ -26,25 +30,39 @@ class Hdf5ObjSheet(Sheet):
             for k, v in source.items():
                 yield Hdf5ObjSheet(self.name, k, source=v)
         elif isinstance(source, h5py.Dataset):
-            if len(source.shape) == 1:
+            if len(source.shape)==1:
                 if source.dtype.names:
-                    for i, colname in enumerate(source.dtype.names):
-                        self.addColumn(ItemColumn(colname, colname), index=i)
+                    for i, (colname, fmt, *_) in enumerate(source.dtype.descr):
+                        if not colname:
+                            colname = f"col{i}"
+                        ctype = _guess_type(fmt)
+                        self.addColumn(ItemColumn(colname, i, type=ctype))
                     yield from source  # copy
                 else:
                     self.addColumn(ItemColumn(source.name, 0))
                     for v in source:
                         yield [v]
-            elif len(source.shape) == 2:  # matrix
+            elif len(source.shape)==2:
+                matrix_enumerate = bool(self.options.hdf5_matrix_enumerate)
                 ncols = source.shape[1]
-                for i in range(ncols):
-                    self.addColumn(ItemColumn('', i, width=8), index=i)
-                self.recalc()
-                yield from source  # copy
+                ctype = _guess_type(source.dtype.descr[0][1])
+                if matrix_enumerate:
+                    self.addColumn(ItemColumn("row", 0, width=8, keycol=1, type=int), index=0)
+                    for i in range(ncols):
+                        self.addColumn(ItemColumn(f'col{i}', i+1, width=8, type=ctype), index=i+1)
+                    self.recalc()
+                    yield from list(list((chain((i,), row))) for i, row in enumerate(source))
+                else:
+                    for i in range(ncols):
+                        self.addColumn(ItemColumn('', i, width=8, type=ctype), index=i)
+                    self.recalc()
+                    yield from source  # copy
             else:
                 vd.fail('too many dimensions in shape %s' % str(source.shape))
         else:
-            vd.fail('unknown h5 object type %s' % type(source))
+            vd.fail(f"too many dimensions in shape {source.shape}")
     def openRow(self, row):
@@ -59,5 +77,11 @@ class Hdf5ObjSheet(Sheet):
         if isinstance(row, numpy.ndarray):
             return NpySheet(None, npy=row)
+def _guess_type(fmt):
+    if 'i' in fmt or 'u' in fmt:
+        return int
+    elif 'f' in fmt:
+        return float
+    return anytype
 Hdf5ObjSheet.addCommand('A', 'dive-metadata', 'vd.push(SheetDict(cursorRow.name + "_attrs", source=cursorRow.attrs))', 'open metadata sheet for object referenced in current row')

visidata 3.1.1__py3-none-any.whl → 3.3__py3-none-any.whl

visidata 3.1.1py3-none-any.whl → 3.3py3-none-any.whl