RubyGems - xnd - Versions diffs - 0.2.0dev3 - Mend

xnd 0.2.0dev3

Files changed (93) hide show

checksums.yaml +7 -0
data/CONTRIBUTING.md +42 -0
data/Gemfile +3 -0
data/History.md +0 -0
data/README.md +7 -0
data/Rakefile +135 -0
data/ext/ruby_xnd/extconf.rb +70 -0
data/ext/ruby_xnd/float_pack_unpack.c +277 -0
data/ext/ruby_xnd/float_pack_unpack.h +39 -0
data/ext/ruby_xnd/gc_guard.c +36 -0
data/ext/ruby_xnd/gc_guard.h +12 -0
data/ext/ruby_xnd/include/xnd.h +449 -0
data/ext/ruby_xnd/lib/libxnd.a +0 -0
data/ext/ruby_xnd/lib/libxnd.so +1 -0
data/ext/ruby_xnd/lib/libxnd.so.0 +1 -0
data/ext/ruby_xnd/lib/libxnd.so.0.2.0dev3 +0 -0
data/ext/ruby_xnd/memory_block_object.c +32 -0
data/ext/ruby_xnd/memory_block_object.h +33 -0
data/ext/ruby_xnd/ruby_xnd.c +1953 -0
data/ext/ruby_xnd/ruby_xnd.h +61 -0
data/ext/ruby_xnd/ruby_xnd_internal.h +85 -0
data/ext/ruby_xnd/util.h +170 -0
data/ext/ruby_xnd/xnd/AUTHORS.txt +5 -0
data/ext/ruby_xnd/xnd/INSTALL.txt +134 -0
data/ext/ruby_xnd/xnd/LICENSE.txt +29 -0
data/ext/ruby_xnd/xnd/MANIFEST.in +3 -0
data/ext/ruby_xnd/xnd/Makefile.in +80 -0
data/ext/ruby_xnd/xnd/README.rst +44 -0
data/ext/ruby_xnd/xnd/config.guess +1530 -0
data/ext/ruby_xnd/xnd/config.h.in +22 -0
data/ext/ruby_xnd/xnd/config.sub +1782 -0
data/ext/ruby_xnd/xnd/configure +4867 -0
data/ext/ruby_xnd/xnd/configure.ac +164 -0
data/ext/ruby_xnd/xnd/doc/Makefile +14 -0
data/ext/ruby_xnd/xnd/doc/_static/copybutton.js +66 -0
data/ext/ruby_xnd/xnd/doc/conf.py +26 -0
data/ext/ruby_xnd/xnd/doc/index.rst +44 -0
data/ext/ruby_xnd/xnd/doc/libxnd/data-structures.rst +186 -0
data/ext/ruby_xnd/xnd/doc/libxnd/functions.rst +148 -0
data/ext/ruby_xnd/xnd/doc/libxnd/index.rst +25 -0
data/ext/ruby_xnd/xnd/doc/releases/index.rst +34 -0
data/ext/ruby_xnd/xnd/doc/xnd/align-pack.rst +96 -0
data/ext/ruby_xnd/xnd/doc/xnd/buffer-protocol.rst +42 -0
data/ext/ruby_xnd/xnd/doc/xnd/index.rst +30 -0
data/ext/ruby_xnd/xnd/doc/xnd/quickstart.rst +62 -0
data/ext/ruby_xnd/xnd/doc/xnd/types.rst +674 -0
data/ext/ruby_xnd/xnd/install-sh +527 -0
data/ext/ruby_xnd/xnd/libxnd/Makefile.in +102 -0
data/ext/ruby_xnd/xnd/libxnd/Makefile.vc +112 -0
data/ext/ruby_xnd/xnd/libxnd/bitmaps.c +345 -0
data/ext/ruby_xnd/xnd/libxnd/contrib.h +313 -0
data/ext/ruby_xnd/xnd/libxnd/copy.c +944 -0
data/ext/ruby_xnd/xnd/libxnd/equal.c +1216 -0
data/ext/ruby_xnd/xnd/libxnd/inline.h +154 -0
data/ext/ruby_xnd/xnd/libxnd/overflow.h +147 -0
data/ext/ruby_xnd/xnd/libxnd/split.c +286 -0
data/ext/ruby_xnd/xnd/libxnd/tests/Makefile.in +39 -0
data/ext/ruby_xnd/xnd/libxnd/tests/Makefile.vc +44 -0
data/ext/ruby_xnd/xnd/libxnd/tests/README.txt +2 -0
data/ext/ruby_xnd/xnd/libxnd/tests/runtest.c +101 -0
data/ext/ruby_xnd/xnd/libxnd/tests/test.h +48 -0
data/ext/ruby_xnd/xnd/libxnd/tests/test_fixed.c +108 -0
data/ext/ruby_xnd/xnd/libxnd/xnd.c +1304 -0
data/ext/ruby_xnd/xnd/libxnd/xnd.h +449 -0
data/ext/ruby_xnd/xnd/python/test_xnd.py +3144 -0
data/ext/ruby_xnd/xnd/python/xnd/__init__.py +290 -0
data/ext/ruby_xnd/xnd/python/xnd/_xnd.c +2822 -0
data/ext/ruby_xnd/xnd/python/xnd/contrib/pretty.py +850 -0
data/ext/ruby_xnd/xnd/python/xnd/docstrings.h +129 -0
data/ext/ruby_xnd/xnd/python/xnd/pyxnd.h +200 -0
data/ext/ruby_xnd/xnd/python/xnd/util.h +182 -0
data/ext/ruby_xnd/xnd/python/xnd_randvalue.py +1121 -0
data/ext/ruby_xnd/xnd/python/xnd_support.py +106 -0
data/ext/ruby_xnd/xnd/setup.py +303 -0
data/ext/ruby_xnd/xnd/vcbuild/INSTALL.txt +42 -0
data/ext/ruby_xnd/xnd/vcbuild/runtest32.bat +16 -0
data/ext/ruby_xnd/xnd/vcbuild/runtest64.bat +14 -0
data/ext/ruby_xnd/xnd/vcbuild/vcbuild32.bat +29 -0
data/ext/ruby_xnd/xnd/vcbuild/vcbuild64.bat +29 -0
data/ext/ruby_xnd/xnd/vcbuild/vcclean.bat +13 -0
data/ext/ruby_xnd/xnd/vcbuild/vcdistclean.bat +14 -0
data/lib/ruby_xnd.so +0 -0
data/lib/xnd.rb +306 -0
data/lib/xnd/monkeys.rb +29 -0
data/lib/xnd/version.rb +6 -0
data/spec/debug_spec.rb +9 -0
data/spec/gc_guard_spec.rb +10 -0
data/spec/leakcheck.rb +9 -0
data/spec/spec_helper.rb +877 -0
data/spec/type_inference_spec.rb +81 -0
data/spec/xnd_spec.rb +2921 -0
data/xnd.gemspec +47 -0
metadata +215 -0

data/ext/ruby_xnd/xnd/doc/libxnd/functions.rst ADDED

@@ -0,0 +1,148 @@
+.. meta::
+   :robots: index,follow
+   :description: libxnd documentation
+.. sectionauthor:: Stefan Krah <skrah at bytereef.org>
+Functions
+=========
+Create typed memory blocks
+--------------------------
+The main use case for libxnd is to create and manage typed memory blocks.
+These blocks are fully initialized to *0*.  References to additional memory
+blocks are allocated and initialized recursively.
+*bytes* and *string* types are initialized to :c:macro:`NULL`, since their
+actual length is not known yet.
+.. topic:: xnd_empty_from_string
+.. code-block:: c
+   xnd_master_t *xnd_empty_from_string(const char *s, uint32_t flags, ndt_context_t *ctx);
+Return a new master buffer according to the type string in *s*.  *flags*
+must include :c:macro:`XND_OWN_TYPE`.
+.. topic:: xnd_empty_from_type
+.. code-block:: c
+   xnd_master_t *xnd_empty_from_type(const ndt_t *t, uint32_t flags, ndt_context_t *ctx);
+Return a new master buffer according to the type *t*.  *flags* must not include
+:c:macro:`XND_OWN_TYPE`, i.e. the type is externally managed.
+This is the case in the Python bindings, where the ndtypes module creates
+and manages types.
+Delete typed memory blocks
+--------------------------
+.. topic:: xnd_del
+.. code-block:: c
+   void xnd_del(xnd_master_t *x);
+Delete the master buffer according to its flags. *x* may be :c:macro:`NULL`.
+*x->master.ptr* and *x->master.type* may be :c:macro:`NULL`.
+The latter situation should only arise when breaking up reference cycles.
+This is used in the Python module.
+Bitmaps
+-------
+.. topic:: xnd_bitmap_next
+.. code-block:: c
+   xnd_bitmap_t xnd_bitmap_next(const xnd_t *x, int64_t i, ndt_context_t *ctx);
+Get the next bitmap for the *Tuple*, *Record*, *Ref* and *Constr* types.
+This is a convenience function that checks if the types have optional
+subtrees.
+If yes, return the bitmap at index *i*.  If not, return an empty bitmap
+that must not be accessed.
+.. topic:: xnd_set_valid
+.. code-block:: c
+   void xnd_set_valid(xnd_t *x);
+Set the validity bit at *x->index*.  *x* must have an optional type.
+.. topic:: xnd_set_na
+.. code-block:: c
+   void xnd_set_na(xnd_t *x);
+Clear the validity bit at *x->index*.  *x* must have an optional type.
+.. topic:: xnd_is_valid
+.. code-block:: c
+   int xnd_is_valid(const xnd_t *x);
+Check if the element at *x->index* is valid.  If *x* does not have an optional
+type, return *1*.  Otherwise, return the validity bit (zero or nonzero).
+.. topic:: xnd_is_na
+.. code-block:: c
+   int xnd_is_na(const xnd_t *x);
+Check if the element at *x->index* is missing (NA).  If *x* does not have an optional
+type, return *0*.  Otherwise, return the negation of the validity bit.
+.. topic:: xnd_subtree
+.. code-block:: c
+   xnd_t xnd_subtree(const xnd_t *x, const xnd_index_t indices[], int len,
+                     ndt_context_t *ctx);
+Apply zero or more indices to the input *x* and return a typed view. Valid
+indices are integers or strings for record fields.
+This function is more general than pure array indexing, hence the name. For
+example, it is possible to index into nested records that in turn contain
+arrays.
+.. topic:: xnd_multikey
+.. code-block:: c
+   xnd_t xnd_multikey(const xnd_t *x, const xnd_index_t indices[], int len,
+                      ndt_context_t *ctx);
+Apply zero or more keys to the input *x* and return a typed view. Valid
+keys are integers or slices.
+This function differs from :c:func:`xnd_subtree` in that it allows
+mixed indexing and slicing for fixed dimensions.  Records and tuples
+cannot be sliced.
+Variable dimensions can be sliced, but do not support mixed indexing
+and slicing.

data/ext/ruby_xnd/xnd/doc/libxnd/index.rst ADDED

@@ -0,0 +1,25 @@
+.. meta::
+   :robots: index, follow
+   :description: libxnd documentation
+   :keywords: libxnd, C, array computing
+.. sectionauthor:: Stefan Krah <skrah at bytereef.org>
+libxnd
+------
+libxnd implements support for typed memory blocks using the libndtypes
+type library.
+Types include ndarrays, ragged arrays (compatible with the Arrow list type),
+optional data (bitmaps are compatible with Arrow), tuples, records (structs),
+strings, bytes and categorical values.
+.. toctree::
+   data-structures.rst
+   functions.rst

data/ext/ruby_xnd/xnd/doc/releases/index.rst ADDED

@@ -0,0 +1,34 @@
+.. meta::
+   :robots: index, follow
+   :description: libxnd documentation
+   :keywords: libxnd, C, array computing
+.. sectionauthor:: Stefan Krah <skrah at bytereef.org>
+========
+Releases
+========
+v0.2.0b2 (February 5th 2018)
+============================
+Second release (beta2). This release addresses several build and packaging issues:
+  - Avoid copying libraries into the Python package if system libraries are used.
+  - The build and install partially relied on the dev setup (ndtypes checked out
+    in the xnd directory).  This dependency has been removed.
+  - The conda build now supports separate library and Python module installs.
+  - Configure now has a **--without-docs** option for skipping the doc install.
+v0.2.0b1 (January 20th 2018)
+============================
+First release (beta1).

data/ext/ruby_xnd/xnd/doc/xnd/align-pack.rst ADDED

@@ -0,0 +1,96 @@
+.. meta::
+   :robots: index,follow
+   :description: xnd container
+   :keywords: xnd, alignment, packing
+.. sectionauthor:: Stefan Krah <skrah at bytereef.org>
+Alignment and packing
+=====================
+The xnd memory allocators support explicit alignment.  Alignment is specified
+in the types.
+Tuples and records
+------------------
+Tuples and records have the *align* and *pack* keywords that have the same
+purpose as gcc's *aligned* and *packed* struct attributes.
+Field alignment
+~~~~~~~~~~~~~~~
+The *align* keyword can be used to specify an alignment that is greater
+than the natural alignment of a field:
+.. doctest::
+   >>> from xnd import *
+   >>> s = "(uint8, uint64 |align=32|, uint64)"
+   >>> x = xnd.empty(s)
+   >>> x.align
+   32
+   >>> x.type.datasize
+   64
+Field packing
+~~~~~~~~~~~~~
+The *pack* keyword can be used to specify an alignment that is smaller
+than the natural alignment of a field:
+.. doctest::
+   >>> s = "(uint8, uint64 |pack=2|, uint64)"
+   >>> x = xnd.empty(s)
+   >>> x.align
+   8
+   >>> x.type.datasize
+   24
+Struct packing
+~~~~~~~~~~~~~~
+The *pack* and *align* keywords can be applied to the entire struct:
+.. doctest::
+   >>> s = "(uint8, uint64, uint64, pack=1)"
+   >>> x = xnd.empty(s)
+   >>> x.align
+   1
+   >>> x.type.datasize
+   17
+Individual field and struct directives are mutually exclusive:
+.. doctest::
+   >>> s = "2 * (uint8 |align=16|, uint64, pack=1)"
+   >>> x = xnd.empty(s)
+   Traceback (most recent call last):
+     File "<stdin>", line 1, in <module>
+   ValueError: cannot have 'pack' tuple attribute and field attributes
+Array alignment
+~~~~~~~~~~~~~~~
+An array has the same alignment as its elements:
+.. doctest::
+   >>> s = "2 * (uint8, uint64, pack=1)"
+   >>> x = xnd.empty(s)
+   >>> x.align
+   1
+   >>> x.type.datasize
+   18

data/ext/ruby_xnd/xnd/doc/xnd/buffer-protocol.rst ADDED

@@ -0,0 +1,42 @@
+.. meta::
+   :robots: index,follow
+   :description: xnd container
+   :keywords: xnd, buffer protocol
+.. sectionauthor:: Stefan Krah <skrah at bytereef.org>
+Buffer protocol
+===============
+xnd supports importing PEP-3118 buffers.
+From NumPy
+----------
+Import a simple ndarray:
+.. doctest::
+   >>> import numpy as np
+   >>> from xnd import *
+   >>> x = np.array([[[0,1,2], [3,4,5]], [[6,7,8], [9,10,11]]])
+   >>> y = xnd.from_buffer(x)
+   >>> y.type
+   ndt("2 * 2 * 3 * int64")
+   >>> y.value
+   [[[0, 1, 2], [3, 4, 5]], [[6, 7, 8], [9, 10, 11]]]
+Import an ndarray with a struct dtype:
+.. doctest::
+   >>> x = np.array([(1000, 400.25, 'abc'), (-23, -1e10, 'cba')],
+   ...              dtype=[('x', '<i4'), ('y', '>f4'), ('z', 'S3')])
+   >>> y = xnd.from_buffer(x)
+   >>> y.type
+   ndt("2 * {x : int32, y : >float32, z : fixed_bytes(size=3)}")
+   >>> y.value
+   [{'x': 1000, 'y': 400.25, 'z': b'abc'}, {'x': -23, 'y': -10000000000.0, 'z': b'cba'}]

data/ext/ruby_xnd/xnd/doc/xnd/index.rst ADDED

@@ -0,0 +1,30 @@
+.. meta::
+   :robots: index, follow
+   :description: xnd documentation
+   :keywords: memory blocks, unboxed values, array computing, Python
+.. sectionauthor:: Stefan Krah <skrah at bytereef.org>
+xnd
+---
+The xnd module implements a container type that maps most Python values
+relevant for scientific computing directly to typed memory.
+Whenever possible, a single, pointer-free memory block is used.
+xnd supports ragged arrays, categorical types, indexing, slicing, aligned memory blocks and type inference.
+Operations like indexing and slicing return zero-copy typed views on the data.
+Importing PEP-3118 buffers is supported.
+.. toctree::
+   :maxdepth: 1
+   types.rst
+   align-pack.rst
+   buffer-protocol.rst
+   quickstart.rst

data/ext/ruby_xnd/xnd/doc/xnd/quickstart.rst ADDED

@@ -0,0 +1,62 @@
+.. meta::
+   :robots: index,follow
+   :description: xnd quickstart
+   :keywords: xnd, install
+.. sectionauthor:: Stefan Krah <skrah at bytereef.org>
+Quick Start
+===========
+Prerequisites
+~~~~~~~~~~~~~
+Python2 is not supported. If not already present, install the Python3
+development packages:
+.. code-block:: sh
+   # Debian, Ubuntu:
+   sudo apt-get install gcc make
+   sudo apt-get install python3-dev
+   # Fedora, RedHat:
+   sudo yum install gcc make
+   sudo yum install python3-devel
+   # openSUSE:
+   sudo zypper install gcc make
+   sudo zypper install python3-devel
+   # BSD:
+   # You know what to do.
+   # Mac OS X:
+   # Install Xcode and Python 3 headers.
+Install
+~~~~~~~
+If `pip <http://pypi.python.org/pypi/pip>`_ is present on the system, installation
+should be as easy as:
+.. code-block:: sh
+   pip install xnd
+Otherwise:
+.. code-block:: sh
+   tar xvzf xnd-0.2.0b1.tar.gz
+   cd xnd-0.2.0b1
+   python3 setup.py install
+Windows
+~~~~~~~
+Refer to the instructions in the *vcbuild* directory in the source distribution.

data/ext/ruby_xnd/xnd/doc/xnd/types.rst ADDED

@@ -0,0 +1,674 @@
+.. meta::
+   :robots: index,follow
+   :description: xnd container
+   :keywords: xnd, types, examples
+.. sectionauthor:: Stefan Krah <skrah at bytereef.org>
+Types
+=====
+The xnd object is a container that maps a wide range of Python values directly
+to memory.  xnd unpacks complex types of arbitrary nesting depth to a single
+memory block.
+Pointers only occur in explicit pointer types like *Ref* (reference), *Bytes*
+and *String*, but not in the general case.
+Type inference
+--------------
+If no explicit type is given, xnd supports type inference by assuming
+types for the most common Python values.
+Fixed arrays
+~~~~~~~~~~~~
+.. doctest::
+   >>> from xnd import *
+   >>> x = xnd([[0, 1, 2], [3, 4, 5]])
+   >>> x
+   xnd([[0, 1, 2], [3, 4, 5]], type='2 * 3 * int64')
+As expected, lists are mapped to ndarrays and integers to int64.  Indexing and
+slicing work the usual way.  For performance reasons these operations return
+zero-copy views whenever possible:
+.. doctest::
+   >>> x[0][1] # Indexing returns views, even for scalars.
+   xnd(1, type='int64')
+   >>>
+   >>> y = x[:, ::-1] # Containers are returned as views.
+   >>> y
+   xnd([[2, 1, 0], [5, 4, 3]], type='2 * 3 * int64')
+Subarrays are views and properly typed:
+.. doctest::
+   >>> x[1]
+   xnd([3, 4, 5], type='3 * int64')
+The representation of large values is abbreviated:
+.. doctest::
+   >>> x = xnd(10 * [200 * [1]])
+   >>> x
+   xnd([[1, 1, 1, 1, 1, 1, 1, 1, 1, ...],
+        [1, 1, 1, 1, 1, 1, 1, 1, 1, ...],
+        [1, 1, 1, 1, 1, 1, 1, 1, 1, ...],
+        [1, 1, 1, 1, 1, 1, 1, 1, 1, ...],
+        [1, 1, 1, 1, 1, 1, 1, 1, 1, ...],
+        [1, 1, 1, 1, 1, 1, 1, 1, 1, ...],
+        [1, 1, 1, 1, 1, 1, 1, 1, 1, ...],
+        [1, 1, 1, 1, 1, 1, 1, 1, 1, ...],
+        [1, 1, 1, 1, 1, 1, 1, 1, 1, ...],
+        ...],
+       type='10 * 200 * int64')
+Values can be accessed in full using the *value* property:
+.. doctest::
+   >>> x = xnd(11 * [1])
+   >>> x
+   xnd([1, 1, 1, 1, 1, 1, 1, 1, 1, ...], type='11 * int64')
+   >>> x.value
+   [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]
+Types can be accessed using the *type* property:
+.. doctest::
+   >>> x = xnd(11 * [1])
+   >>> x.type
+   ndt("11 * int64")
+Ragged arrays
+~~~~~~~~~~~~~
+Ragged arrays are compatible with the Arrow list representation. The data
+is pointer-free; addressing the elements works by having one offset array
+per dimension.
+.. doctest::
+   >>> xnd([[0.1j], [3+2j, 4+5j, 10j]])
+   xnd([[0.1j], [(3+2j), (4+5j), 10j]], type='var * var * complex128')
+Indexing and slicing work as usual, returning properly typed views or
+values in the case of scalars:
+.. doctest::
+   >>> x = xnd([[0.1j], [3+2j, 4+5j, 10j]])
+   >>> x[1, 2]
+   xnd(10j, type='complex128')
+   >>> x[1]
+   xnd([(3+2j), (4+5j), 10j], type='var * complex128')
+Eliminating dimensions through mixed slicing and indexing is not supported
+because it would require copying and adjusting potentially huge offset arrays:
+.. doctest::
+   >>> y = x[:, 1]
+   Traceback (most recent call last):
+     File "<stdin>", line 1, in <module>
+   IndexError: mixed indexing and slicing is not supported for var dimensions
+Records (structs)
+~~~~~~~~~~~~~~~~~
+From Python 3.6 on, dicts retain their order, so they can be used directly
+for initializing C structs.
+.. doctest::
+   >>> xnd({'a': 'foo', 'b': 10.2})
+   xnd({'a': 'foo', 'b': 10.2}, type='{a : string, b : float64}')
+Tuples
+~~~~~~
+Python tuples are directly translated to the libndtypes tuple type:
+.. doctest::
+   >>> xnd(('foo', b'bar', [None, 10.0, 20.0]))
+   xnd(('foo', b'bar', [None, 10.0, 20.0]), type='(string, bytes, 3 * ?float64)')
+Nested arrays in structs
+~~~~~~~~~~~~~~~~~~~~~~~~
+xnd seamlessly supports nested values of arbitrary depth:
+.. doctest::
+   >>> lst = [{'name': 'John', 'internet_points': [1, 2, 3]},
+   ...        {'name': 'Jane', 'internet_points': [4, 5, 6]}]
+   >>> xnd(lst)
+   xnd([{'name': 'John', 'internet_points': [1, 2, 3]}, {'name': 'Jane', 'internet_points': [4, 5, 6]}],
+       type='2 * {name : string, internet_points : 3 * int64}')
+Optional data (missing values)
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+Optional data is currently specified using *None*.  It is under debate if
+a separate *NA* singleton object would be more suitable.
+.. doctest::
+   >>> lst = [0, 1, None, 2, 3, None, 5, 10]
+   >>> xnd(lst)
+   xnd([0, 1, None, 2, 3, None, 5, 10], type='8 * ?int64')
+Categorical data
+~~~~~~~~~~~~~~~~
+Type inference would be ambiguous, so it cannot work directly. xnd supports
+the *levels* argument that is internally translated to the type.
+.. doctest::
+   >>> levels = ['January', 'August', 'December', None]
+   >>> x = xnd(['January', 'January', None, 'December', 'August', 'December', 'December'], levels=levels)
+   >>> x.value
+   ['January', 'January', None, 'December', 'August', 'December', 'December']
+   >>> x.type
+   ndt("7 * categorical('January', 'August', 'December', NA)")
+The above is equivalent to specifying the type directly:
+.. doctest::
+   >>> from ndtypes import *
+   >>> t = ndt("7 * categorical('January', 'August', 'December', NA)")
+   >>> x = xnd(['January', 'January', None, 'December', 'August', 'December', 'December'], type=t)
+   >>> x.value
+   ['January', 'January', None, 'December', 'August', 'December', 'December']
+   >>> x.type
+   ndt("7 * categorical('January', 'August', 'December', NA)")
+Explicit types
+--------------
+While type inference is well-defined, it necessarily makes assumptions about
+the programmer's intent.
+There are two cases where types should be given:
+Different types are intended
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+.. doctest::
+   >>> xnd([[0,1,2], [3,4,5]], type="2 * 3 * uint8")
+   xnd([[0, 1, 2], [3, 4, 5]], type='2 * 3 * uint8')
+Here, type inference would deduce :c:macro:`int64`, so :c:macro:`uint8` needs
+to be passed explicitly.
+Performance
+~~~~~~~~~~~
+For large arrays, explicit types are significantly faster.  Type inference
+supports arbitrary nesting depth, is complex and still implemented in pure
+Python. Compare:
+.. doctest::
+   >>> lst = [1] * 1000000
+   >>> x = xnd(lst) # inference
+   >>>
+   >>> x = xnd(lst, type='1000000 * int64') # explicit
+All supported types
+-------------------
+Fixed arrays
+~~~~~~~~~~~~
+Fixed arrays are similar to NumPy's ndarray. One difference is that internally
+xnd uses steps instead of strides. One step is the number of indices required
+to move the linear index from one dimension element to the next.
+This facilitates optional data, whose bitmaps need to be addressed by the
+linear index.  The equation *stride = step * itemsize* always holds.
+.. doctest::
+   >>> xnd([[[1,2], [None, 3]], [[4, None], [5, 6]]])
+   xnd([[[1, 2], [None, 3]], [[4, None], [5, 6]]], type='2 * 2 * 2 * ?int64')
+This is a fixed array with optional data.
+.. doctest::
+   >>> xnd([(1,2.0,3j), (4,5.0,6j)])
+   xnd([(1, 2.0, 3j), (4, 5.0, 6j)], type='2 * (int64, float64, complex128)')
+An array with tuple elements.
+Fortran order
+~~~~~~~~~~~~~
+Fortran order is specified by prefixing the dimensions with an exclamation mark:
+.. doctest::
+   >>> lst = [[1, 2, 3], [4, 5, 6]]
+   >>> x = xnd(lst, type='!2 * 3 * uint16')
+   >>>
+   >>> x.type.shape
+   (2, 3)
+   >>> x.type.strides
+   (2, 4)
+Alternatively, steps can be passed as arguments to the fixed dimension type:
+.. doctest::
+   >>> from ndtypes import *
+   >>> lst = [[1, 2, 3], [4, 5, 6]]
+   >>> t = ndt("fixed(shape=2, step=1) * fixed(shape=3, step=2) * uint16")
+   >>> x = xnd(lst, type=t)
+   >>> x.type.shape
+   (2, 3)
+   >>> x.type.strides
+   (2, 4)
+Ragged arrays
+~~~~~~~~~~~~~
+Ragged arrays with explicit types are easiest to construct using the *dtype*
+argument to the xnd constructor.
+.. doctest::
+   >>> lst = [[0], [1, 2], [3, 4, 5]]
+   >>> xnd(lst, dtype="int32")
+   xnd([[0], [1, 2], [3, 4, 5]], type='var * var * int32')
+Alternatively, offsets can be passed as arguments to the var dimension type:
+.. doctest::
+   >>> from ndtypes import ndt
+   >>> t = ndt("var(offsets=[0,3]) * var(offsets=[0,1,3,6]) * int32")
+   >>> xnd(lst, type=t)
+   xnd([[0], [1, 2], [3, 4, 5]], type='var * var * int32')
+Tuples
+~~~~~~
+In memory, tuples are the same as C structs.
+.. doctest::
+   >>> xnd(("foo", 1.0))
+   xnd(('foo', 1.0), type='(string, float64)')
+Indexing works the same as for arrays:
+.. doctest::
+   >>> x = xnd(("foo", 1.0))
+   >>> x[0]
+   xnd('foo', type='string')
+Nested tuples are more general than ragged arrays: a) they can hold different
+data types, and b) the trees they represent may be unbalanced.
+They do not allow slicing though and are probably less efficient.
+This is an example of an unbalanced tree that cannot be represented as a
+ragged array:
+.. doctest::
+   >>> unbalanced_tree = (((1.0, 2.0), (3.0)), 4.0, ((5.0, 6.0, 7.0), ()))
+   >>> x = xnd(unbalanced_tree)
+   >>> x.value
+   (((1.0, 2.0), 3.0), 4.0, ((5.0, 6.0, 7.0), ()))
+   >>> x.type
+   ndt("(((float64, float64), float64), float64, ((float64, float64, float64), ()))")
+   >>>
+   >>> x[0]
+   xnd(((1.0, 2.0), 3.0), type='((float64, float64), float64)')
+   >>> x[0][0]
+   xnd((1.0, 2.0), type='(float64, float64)')
+Note that the data in the above tree example is packed into a single contiguous
+memory block.
+Records
+~~~~~~~
+In memory, records are C structs. The field names are only stored in the type.
+The following examples use Python-3.6, which keeps the dict initialization
+order.
+.. doctest::
+   >>> x = xnd({'a': b'123', 'b': {'x': 1.2, 'y': 100+3j}})
+   >>> x.value
+   {'a': b'123', 'b': {'x': 1.2, 'y': (100+3j)}}
+   >>> x.type
+   ndt("{a : bytes, b : {x : float64, y : complex128}}")
+Indexing works the same as for arrays. Additionally, fields can be indexed
+by name:
+.. doctest::
+   >>> x[0]
+   xnd(b'123', type='bytes')
+   >>> x['a']
+   xnd(b'123', type='bytes')
+   >>> x['b']
+   xnd({'x': 1.2, 'y': (100+3j)}, type='{x : float64, y : complex128}')
+The nesting depth is arbitrary.  In the following example, the data -- except
+for strings, which are pointers -- is packed into a single contiguous memory
+block:
+.. code-block:: py
+   >>> from pprint import pprint
+   >>> item = {
+   ...   "id": 1001,
+   ...   "name": "cyclotron",
+   ...   "price": 5998321.99,
+   ...   "tags": ["connoisseur", "luxury"],
+   ...   "stock": {
+   ...     "warehouse": 722,
+   ...     "retail": 20
+   ...   }
+   ... }
+   >>> x = xnd(item)
+   >>>
+   >>> pprint(x.value)
+   {'id': 1001,
+    'name': 'cyclotron',
+    'price': 5998321.99,
+    'stock': {'retail': 20, 'warehouse': 722},
+    'tags': ['connoisseur', 'luxury']}
+   >>>
+   >>> x.type.pprint()
+   {
+     id : int64,
+     name : string,
+     price : float64,
+     tags : 2 * string,
+     stock : {
+       warehouse : int64,
+       retail : int64
+     }
+   }
+Strings can be embedded into the array by specifying the fixed string type.
+In this case, the memory block is pointer-free.
+.. code-block:: py
+   >>> from ndtypes import ndt
+   >>>
+   >>> t = """
+   ...   { id : int64,
+   ...     name : fixed_string(30),
+   ...     price : float64,
+   ...     tags : 2 * fixed_string(30),
+   ...     stock : {warehouse : int64, retail : int64}
+   ...   }
+   ... """
+   >>>
+   >>> x = xnd(item, type=t)
+   >>> x.type.pprint()
+   {
+     id : int64,
+     name : fixed_string(30),
+     price : float64,
+     tags : 2 * fixed_string(30),
+     stock : {
+       warehouse : int64,
+       retail : int64
+     }
+   }
+Record of arrays
+~~~~~~~~~~~~~~~~
+Often it is more memory efficient to store an array of records as a record of
+arrays.  This example with columnar data is from the Arrow homepage:
+.. doctest::
+   >>> data = {'session_id': [1331247700, 1331247702, 1331247709, 1331247799],
+   ...         'timestamp': [1515529735.4895875, 1515529746.2128427, 1515529756.4485607, 1515529766.2181058],
+   ...         'source_ip': ['8.8.8.100', '100.2.0.11', '99.101.22.222', '12.100.111.200']}
+   >>> x = xnd(data)
+   >>> x.type
+   ndt("{session_id : 4 * int64, timestamp : 4 * float64, source_ip : 4 * string}")
+References
+~~~~~~~~~~
+References are transparent pointers to new memory blocks (meaning a new
+data pointer, not a whole new xnd buffer).
+For example, this is an array of pointers to arrays:
+.. doctest::
+   >>> t = ndt("3 * ref(4 * uint64)")
+   >>> lst = [[0,1,2,3], [4,5,6,7], [8,9,10,11]]
+   >>> xnd(lst, type=t)
+   xnd([[0, 1, 2, 3], [4, 5, 6, 7], [8, 9, 10, 11]], type='3 * ref(4 * uint64)')
+The user sees no difference to a regular 3 by 4 array, but internally
+the outer dimension consists of three pointers to the inner arrays.
+For memory blocks generated by xnd itself the feature is not so useful --
+after all, it is usually better to have a single memory block than one
+with additional pointers.
+However, suppose that in the above columnar data example another application
+represents the arrays inside the record with pointers.  Using the *ref* type,
+data structures borrowed from such an application can be properly typed:
+.. doctest::
+   >>> t = ndt("{session_id : &4 * int64, timestamp : &4 * float64, source_ip : &4 * string}")
+   >>> x = xnd(data, type=t)
+   >>> x.type
+   ndt("{session_id : ref(4 * int64), timestamp : ref(4 * float64), source_ip : ref(4 * string)}")
+The ampersand is the shorthand for "ref".
+Constructors
+~~~~~~~~~~~~
+Constructors are xnd's way of creating distinct named types. The constructor
+argument is a regular type.
+Constructors open up a new dtype, so named arrays can be the dtype of
+other arrays.  Type inference currently isn't aware of constructors,
+so types have to be provided.
+.. doctest::
+   >>> t = ndt("3 * SomeMatrix(2 * 2 * float32)")
+   >>> lst = [[[1,2], [3,4]], [[5,6], [7,8]], [[9,10], [11,12]]]
+   >>> x = xnd(lst, type=t)
+   >>> x
+   xnd([[[1.0, 2.0], [3.0, 4.0]], [[5.0, 6.0], [7.0, 8.0]], [[9.0, 10.0], [11.0, 12.0]]],
+       type='3 * SomeMatrix(2 * 2 * float32)')
+   >>> x[0]
+   xnd([[1.0, 2.0], [3.0, 4.0]], type='SomeMatrix(2 * 2 * float32)')
+Categorical
+~~~~~~~~~~~
+Categorical types contain values.  The data stored in xnd buffers are indices
+(:c:macro:`int64`) into the type's categories.
+.. doctest::
+   >>> t = ndt("categorical('a', 'b', 'c', NA)")
+   >>> data = ['a', 'a', 'b', 'a', 'a', 'a', 'foo', 'c']
+   >>> x = xnd(data, dtype=t)
+   >>> x.value
+   ['a', 'a', 'b', 'a', 'a', 'a', None, 'c']
+Fixed String
+~~~~~~~~~~~~
+Fixed strings are embedded into arrays.  Supported encodings are 'ascii',
+'utf8', 'utf16' and 'utf32'. The string size argument denotes the number
+of code points rather than bytes.
+.. doctest::
+   >>> t = ndt("10 * fixed_string(3, 'utf32')")
+   >>> x = xnd.empty(t)
+   >>> x.value
+   ['', '', '', '', '', '', '', '', '', '']
+   >>> x[3] = "\U000003B1\U000003B2\U000003B3"
+   >>> x.value
+   ['', '', '', 'αβγ', '', '', '', '', '', '']
+Fixed Bytes
+~~~~~~~~~~~
+Fixed bytes are embedded into arrays.
+.. doctest::
+   >>> t = ndt("3 * fixed_bytes(size=3)")
+   >>> x = xnd.empty(t)
+   >>> x[2] = b'123'
+   >>> x.value
+   [b'\x00\x00\x00', b'\x00\x00\x00', b'123']
+   >>> x.align
+   1
+Alignment can be requested with the requirement that size is a multiple of
+alignment:
+.. doctest::
+   >>> t = ndt("3 * fixed_bytes(size=32, align=16)")
+   >>> x = xnd.empty(t)
+   >>> x.align
+   16
+String
+~~~~~~
+Strings are pointers to :c:macro:`NUL`-terminated UTF-8 strings.
+.. doctest::
+   >>> x = xnd.empty("10 * string")
+   >>> x.value
+   ['', '', '', '', '', '', '', '', '', '']
+   >>> x[0] = "abc"
+   >>> x.value
+   ['abc', '', '', '', '', '', '', '', '', '']
+Bytes
+~~~~~
+Internally, bytes are structs with a size field and a pointer to the data.
+.. doctest::
+   >>> xnd([b'123', b'45678'])
+   xnd([b'123', b'45678'], type='2 * bytes')
+The bytes constructor takes an optional *align* argument that specifies the
+alignment of the allocated data:
+.. doctest::
+   >>> x = xnd([b'abc', b'123'], type="2 * bytes(align=64)")
+   >>> x.value
+   [b'abc', b'123']
+   >>> x.align
+   8
+Note that *x.align* is the alignment of the array.  The embedded pointers
+to the bytes data are aligned at *64*.
+Primitive types
+~~~~~~~~~~~~~~~
+As a short example, here is a tuple that contains all primitive types:
+.. doctest::
+   >>> s = """
+   ...    (bool,
+   ...     int8, int16, int32, int64,
+   ...     uint8, uint16, uint32, uint64,
+   ...     float16, float32, float64,
+   ...     complex32, complex64, complex128)
+   ... """
+   >>> x = xnd.empty(s)
+   >>> x.value
+   (False, 0, 0, 0, 0, 0, 0, 0, 0, 0.0, 0.0, 0.0, 0j, 0j, 0j)