PyPI - westpa - Versions diffs - 2022.13__cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl - Mend

westpa 2022.13__cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (162) hide show

westpa/__init__.py +14 -0
westpa/_version.py +21 -0
westpa/analysis/__init__.py +5 -0
westpa/analysis/core.py +749 -0
westpa/analysis/statistics.py +27 -0
westpa/analysis/trajectories.py +369 -0
westpa/cli/__init__.py +0 -0
westpa/cli/core/__init__.py +0 -0
westpa/cli/core/w_fork.py +152 -0
westpa/cli/core/w_init.py +230 -0
westpa/cli/core/w_run.py +77 -0
westpa/cli/core/w_states.py +212 -0
westpa/cli/core/w_succ.py +99 -0
westpa/cli/core/w_truncate.py +68 -0
westpa/cli/tools/__init__.py +0 -0
westpa/cli/tools/ploterr.py +506 -0
westpa/cli/tools/plothist.py +706 -0
westpa/cli/tools/w_assign.py +597 -0
westpa/cli/tools/w_bins.py +166 -0
westpa/cli/tools/w_crawl.py +119 -0
westpa/cli/tools/w_direct.py +557 -0
westpa/cli/tools/w_dumpsegs.py +94 -0
westpa/cli/tools/w_eddist.py +506 -0
westpa/cli/tools/w_fluxanl.py +376 -0
westpa/cli/tools/w_ipa.py +832 -0
westpa/cli/tools/w_kinavg.py +127 -0
westpa/cli/tools/w_kinetics.py +96 -0
westpa/cli/tools/w_multi_west.py +414 -0
westpa/cli/tools/w_ntop.py +213 -0
westpa/cli/tools/w_pdist.py +515 -0
westpa/cli/tools/w_postanalysis_matrix.py +82 -0
westpa/cli/tools/w_postanalysis_reweight.py +53 -0
westpa/cli/tools/w_red.py +491 -0
westpa/cli/tools/w_reweight.py +780 -0
westpa/cli/tools/w_select.py +226 -0
westpa/cli/tools/w_stateprobs.py +111 -0
westpa/cli/tools/w_timings.py +113 -0
westpa/cli/tools/w_trace.py +599 -0
westpa/core/__init__.py +0 -0
westpa/core/_rc.py +673 -0
westpa/core/binning/__init__.py +55 -0
westpa/core/binning/_assign.c +36018 -0
westpa/core/binning/_assign.cpython-312-aarch64-linux-gnu.so +0 -0
westpa/core/binning/_assign.pyx +370 -0
westpa/core/binning/assign.py +454 -0
westpa/core/binning/binless.py +96 -0
westpa/core/binning/binless_driver.py +54 -0
westpa/core/binning/binless_manager.py +189 -0
westpa/core/binning/bins.py +47 -0
westpa/core/binning/mab.py +506 -0
westpa/core/binning/mab_driver.py +54 -0
westpa/core/binning/mab_manager.py +197 -0
westpa/core/data_manager.py +1761 -0
westpa/core/extloader.py +74 -0
westpa/core/h5io.py +1079 -0
westpa/core/kinetics/__init__.py +24 -0
westpa/core/kinetics/_kinetics.c +45174 -0
westpa/core/kinetics/_kinetics.cpython-312-aarch64-linux-gnu.so +0 -0
westpa/core/kinetics/_kinetics.pyx +815 -0
westpa/core/kinetics/events.py +147 -0
westpa/core/kinetics/matrates.py +156 -0
westpa/core/kinetics/rate_averaging.py +266 -0
westpa/core/progress.py +218 -0
westpa/core/propagators/__init__.py +54 -0
westpa/core/propagators/executable.py +592 -0
westpa/core/propagators/loaders.py +196 -0
westpa/core/reweight/__init__.py +14 -0
westpa/core/reweight/_reweight.c +36899 -0
westpa/core/reweight/_reweight.cpython-312-aarch64-linux-gnu.so +0 -0
westpa/core/reweight/_reweight.pyx +439 -0
westpa/core/reweight/matrix.py +126 -0
westpa/core/segment.py +119 -0
westpa/core/sim_manager.py +839 -0
westpa/core/states.py +359 -0
westpa/core/systems.py +93 -0
westpa/core/textio.py +74 -0
westpa/core/trajectory.py +603 -0
westpa/core/we_driver.py +910 -0
westpa/core/wm_ops.py +43 -0
westpa/core/yamlcfg.py +298 -0
westpa/fasthist/__init__.py +34 -0
westpa/fasthist/_fasthist.c +38755 -0
westpa/fasthist/_fasthist.cpython-312-aarch64-linux-gnu.so +0 -0
westpa/fasthist/_fasthist.pyx +222 -0
westpa/mclib/__init__.py +271 -0
westpa/mclib/__main__.py +28 -0
westpa/mclib/_mclib.c +34610 -0
westpa/mclib/_mclib.cpython-312-aarch64-linux-gnu.so +0 -0
westpa/mclib/_mclib.pyx +226 -0
westpa/oldtools/__init__.py +4 -0
westpa/oldtools/aframe/__init__.py +35 -0
westpa/oldtools/aframe/atool.py +75 -0
westpa/oldtools/aframe/base_mixin.py +26 -0
westpa/oldtools/aframe/binning.py +178 -0
westpa/oldtools/aframe/data_reader.py +560 -0
westpa/oldtools/aframe/iter_range.py +200 -0
westpa/oldtools/aframe/kinetics.py +117 -0
westpa/oldtools/aframe/mcbs.py +153 -0
westpa/oldtools/aframe/output.py +39 -0
westpa/oldtools/aframe/plotting.py +88 -0
westpa/oldtools/aframe/trajwalker.py +126 -0
westpa/oldtools/aframe/transitions.py +469 -0
westpa/oldtools/cmds/__init__.py +0 -0
westpa/oldtools/cmds/w_ttimes.py +361 -0
westpa/oldtools/files.py +34 -0
westpa/oldtools/miscfn.py +23 -0
westpa/oldtools/stats/__init__.py +4 -0
westpa/oldtools/stats/accumulator.py +35 -0
westpa/oldtools/stats/edfs.py +129 -0
westpa/oldtools/stats/mcbs.py +96 -0
westpa/tools/__init__.py +33 -0
westpa/tools/binning.py +472 -0
westpa/tools/core.py +340 -0
westpa/tools/data_reader.py +159 -0
westpa/tools/dtypes.py +31 -0
westpa/tools/iter_range.py +198 -0
westpa/tools/kinetics_tool.py +343 -0
westpa/tools/plot.py +283 -0
westpa/tools/progress.py +17 -0
westpa/tools/selected_segs.py +154 -0
westpa/tools/wipi.py +751 -0
westpa/trajtree/__init__.py +4 -0
westpa/trajtree/_trajtree.c +17829 -0
westpa/trajtree/_trajtree.cpython-312-aarch64-linux-gnu.so +0 -0
westpa/trajtree/_trajtree.pyx +130 -0
westpa/trajtree/trajtree.py +117 -0
westpa/westext/__init__.py +0 -0
westpa/westext/adaptvoronoi/__init__.py +3 -0
westpa/westext/adaptvoronoi/adaptVor_driver.py +214 -0
westpa/westext/hamsm_restarting/__init__.py +3 -0
westpa/westext/hamsm_restarting/example_overrides.py +35 -0
westpa/westext/hamsm_restarting/restart_driver.py +1165 -0
westpa/westext/stringmethod/__init__.py +11 -0
westpa/westext/stringmethod/fourier_fitting.py +69 -0
westpa/westext/stringmethod/string_driver.py +253 -0
westpa/westext/stringmethod/string_method.py +306 -0
westpa/westext/weed/BinCluster.py +180 -0
westpa/westext/weed/ProbAdjustEquil.py +100 -0
westpa/westext/weed/UncertMath.py +247 -0
westpa/westext/weed/__init__.py +10 -0
westpa/westext/weed/weed_driver.py +192 -0
westpa/westext/wess/ProbAdjust.py +101 -0
westpa/westext/wess/__init__.py +6 -0
westpa/westext/wess/wess_driver.py +217 -0
westpa/work_managers/__init__.py +57 -0
westpa/work_managers/core.py +396 -0
westpa/work_managers/environment.py +134 -0
westpa/work_managers/mpi.py +318 -0
westpa/work_managers/processes.py +201 -0
westpa/work_managers/serial.py +28 -0
westpa/work_managers/threads.py +79 -0
westpa/work_managers/zeromq/__init__.py +20 -0
westpa/work_managers/zeromq/core.py +635 -0
westpa/work_managers/zeromq/node.py +131 -0
westpa/work_managers/zeromq/work_manager.py +526 -0
westpa/work_managers/zeromq/worker.py +320 -0
westpa-2022.13.dist-info/METADATA +179 -0
westpa-2022.13.dist-info/RECORD +162 -0
westpa-2022.13.dist-info/WHEEL +7 -0
westpa-2022.13.dist-info/entry_points.txt +30 -0
westpa-2022.13.dist-info/licenses/LICENSE +21 -0
westpa-2022.13.dist-info/top_level.txt +1 -0

westpa/core/reweight/_reweight.cpython-312-aarch64-linux-gnu.so ADDED Viewed

Binary file

westpa/core/reweight/_reweight.pyx ADDED Viewed

@@ -0,0 +1,439 @@
+# A cythoned version of the original function of the stats_process function,
+# based on _kinetics.pyx
+from __future__ import print_function,division
+import cython
+import numpy as np
+import h5py
+from scipy.sparse import csgraph
+import warnings
+from collections import Counter
+cimport numpy as np
+cimport scipy.linalg
+cimport scipy.linalg.cython_lapack as cl
+import scipy.linalg
+from libc.math cimport isnan
+ctypedef np.uint16_t index_t
+ctypedef np.float64_t weight_t
+ctypedef np.uint8_t bool_t
+ctypedef np.int64_t trans_t
+ctypedef np.uintp_t uint_t # 32 bits on 32-bit systems, 64 bits on 64-bit systems
+ctypedef unsigned short Ushort
+ctypedef double complex Cdouble
+weight_dtype = np.float64
+index_dtype = np.uint16
+bool_dtype = np.bool_
+intc_dtype = np.intc
+@cython.boundscheck(False)
+@cython.wraparound(False)
+cpdef stats_process(np.ndarray[index_t, ndim=2] bin_assignments,
+                    np.ndarray[weight_t, ndim=1] weights,
+                    np.ndarray[weight_t, ndim=2] fluxes,
+                    np.ndarray[weight_t, ndim=1] populations,
+                    np.ndarray[trans_t, ndim=2] trans,
+                    np.ndarray[index_t, ndim=2] mask,
+                    str interval='timepoint'):
+    # Accumulate weighted bin-to-bin fluxes, transition counts and initial-bin
+    # populations, in place, into ``fluxes``, ``trans`` and ``populations``.
+    #
+    # bin_assignments[k, i] is read as the bin of row k at column i; weights[k]
+    # is the weight added for every transition recorded for row k.  A row is
+    # skipped entirely when mask[k, 0] == 1 (only column 0 of ``mask`` is read).
+    #
+    # interval == 'timepoint': every consecutive column pair (i, i + 1) counts
+    #                          as one transition.
+    # interval == 'iteration': only the pair (first column, last column) counts.
+    #
+    # Returns None.  Raises ValueError for any other ``interval`` instead of
+    # silently leaving the accumulators untouched.
+    cdef:
+        # The extents are Py_ssize_t: declaring them as uint16 (index_t) would
+        # silently wrap for more than 65535 rows or columns.
+        Py_ssize_t i, k, nsegs, npts
+        index_t ibin, fbin
+        weight_t w
+    nsegs = bin_assignments.shape[0]
+    npts = bin_assignments.shape[1]
+    if interval == 'timepoint':
+        for i in range(npts - 1):
+            for k in range(nsegs):
+                if mask[k, 0] == 1:
+                    continue
+                ibin = bin_assignments[k, i]
+                fbin = bin_assignments[k, i + 1]
+                w = weights[k]
+                fluxes[ibin, fbin] += w
+                trans[ibin, fbin] += 1
+                populations[ibin] += w
+        return
+    if interval == 'iteration':
+        # With bounds checking and wraparound disabled, indexing column
+        # npts - 1 of an array without columns would read out of bounds.
+        if npts < 1:
+            return
+        for k in range(nsegs):
+            if mask[k, 0] == 1:
+                continue
+            ibin = bin_assignments[k, 0]
+            fbin = bin_assignments[k, npts - 1]
+            w = weights[k]
+            fluxes[ibin, fbin] += w
+            trans[ibin, fbin] += 1
+            populations[ibin] += w
+        return
+    raise ValueError("unknown interval {!r}; expected 'timepoint' or 'iteration'".format(interval))
+@cython.boundscheck(False)
+@cython.wraparound(False)
+@cython.cdivision(True)
+cpdef int normalize(weight_t[:,:] m, Py_ssize_t nfbins) nogil:
+    # Divide each of the first ``nfbins`` rows of ``m`` (first ``nfbins``
+    # columns only) by that row's sum, in place.  Rows that sum to exactly
+    # zero are left as they are.  Always returns 0.
+    cdef:
+        Py_ssize_t row, col
+        weight_t total
+    for row in range(nfbins):
+        total = 0
+        for col in range(nfbins):
+            total += m[row, col]
+        if total == 0:
+            # Nothing to scale; dividing would only produce NaN/inf.
+            continue
+        for col in range(nfbins):
+            m[row, col] /= total
+    return 0
+@cython.boundscheck(False)
+@cython.wraparound(False)
+@cython.cdivision(True)
+cpdef reweight_for_c(rows, cols, obs, flux, insert, indices, nstates, nbins, state_labels, state_map, nfbins, istate, jstate, stride, bin_last_state_map, bin_state_map, return_obs, obs_threshold=1):
+    # Build a transition matrix from sparse per-iteration flux/observation
+    # data, solve for its steady state, and return one derived quantity
+    # selected by ``return_obs``.
+    #
+    # Steps, in order (see the nogil section below):
+    #   1. expand ``indices`` by ``stride`` into a list of iteration indices;
+    #   2. sum the selected sparse ``flux`` and ``obs`` entries into dense
+    #      nfbins x nfbins matrices;
+    #   3. zero matrix elements observed fewer than ``obs_threshold`` times;
+    #   4. row-normalise and hand the matrix to steadystate_solve();
+    #   5. fold the resulting bin probabilities into per-state arrays and
+    #      state-to-state fluxes.
+    #
+    # ``return_obs`` selects the return value:
+    #   'F' -> _rw_state_flux[istate, jstate]
+    #   'S' -> _rw_state_probs[istate]
+    #   'C' -> _rw_color_probs[istate]
+    #   'R' -> flux / (color_prob[istate] / (color_prob[istate] + color_prob[jstate])),
+    #          or 0.0 when color_prob[istate] is exactly zero
+    #   'P' -> the whole rw_bin_probs array
+    # Scalar results that are NaN are replaced by 0.0.  Any other value of
+    # ``return_obs`` falls off the end of the function (implicit None).
+    #
+    # ``state_labels`` and ``state_map`` are accepted but not referenced in
+    # this function body.
+    #
+    # Instead of pulling in start and stop, we'll pull in a list of indices.
+    # This way, it should support the bootstrap.
+    cdef:
+        int[:] _rows, _cols, _obs, _ins, _nrows, _ncols, _nobs, _visited
+        long[:]  _bin_last_state_map
+        weight_t[:] _flux, _total_pop, _rw_bin_probs, _nflux, _rw_color_probs, _rw_state_probs
+        double[:] _eigvals, _eigvalsi
+        int n_trans, _nstates, lind, _nfbins, _stride, _obs_threshold, nnz, nlind, i, j, _istate, _jstate
+        Ushort[:] _indices, _bin_state_map
+        weight_t _return_value
+        Ushort[:] _new_indices
+        weight_t[:,:] _total_fluxes, _transition_matrix, _rw_state_flux, _strong_transition_matrix
+        double[:,:] _WORK, _eigvecs
+        int[:,:] _total_obs, _graph
+        #bint _return_flux, _return_states, _return_color
+        str _return_obs
+        #double[:] eigvals, eigvalsi
+        #double[:,:] eigvecs, WORK
+    # CREATE NUMPY ARRAYS
+    # This is a temporary measure that fixes some segfaults, which implies I'm probably off by
+    # a little bit.  Memory heavy, but whatever.
+    # It breaks depending on things, so I need to root that out.  Clearly, nnz is larger than that.
+    _flux = flux
+    # nnz: number of sparse entries available; used below as an upper bound
+    # on the entry index inside accumulate_fluxes()/accumulate_obs().
+    nnz = len(flux)
+    lind = indices.shape[0]
+    # Each entry of ``indices`` expands to ``stride`` consecutive iterations.
+    nlind = indices.shape[0]*stride
+    total_fluxes = np.zeros((nfbins, nfbins), weight_dtype)
+    total_obs = np.zeros((nfbins, nfbins), intc_dtype)
+    transition_matrix = np.zeros((nfbins, nfbins), weight_dtype)
+    strong_transition_matrix = np.zeros((nfbins, nfbins), weight_dtype)
+    visited = np.zeros((nfbins), intc_dtype)
+    # Row z of ``graph``: column 0 is a member count, columns 1.. hold member
+    # bin indices (filled in by return_strong_component()).
+    graph = np.zeros((nfbins, nfbins+1), dtype=intc_dtype)
+    rw_bin_probs = np.zeros(nfbins, weight_dtype)
+    new_indices = np.zeros(((nlind)), dtype=indices.dtype)
+    rw_state_flux = np.zeros((nstates, nstates), np.float64)
+    state_flux = np.zeros((nstates, nstates), weight_dtype)
+    eigvals = np.zeros((nfbins), np.float64)
+    eigvalsi = np.zeros((nfbins), np.float64)
+    eigvecs = np.zeros((nfbins, nfbins), np.float64)
+    # LAPACK workspace; steadystate_solve() advertises LWORK = 4 * nfbins.
+    WORK = np.zeros((nfbins*4, nfbins*4), np.float64)
+    rw_color_probs = np.zeros((nstates), weight_dtype)
+    rw_state_probs = np.zeros((nbins), weight_dtype)
+    # CREATE MEMORYVIEWS
+    # These are for what we sent in...
+    _rows = rows
+    _cols = cols
+    _obs = obs
+    _flux = flux
+    _ins = insert
+    _nstates = nstates
+    # ... these are for functions we'll be using.
+    _total_fluxes = total_fluxes
+    _total_obs = total_obs
+    _transition_matrix = transition_matrix
+    _strong_transition_matrix = strong_transition_matrix
+    _nfbins = nfbins
+    _stride = stride
+    _obs_threshold = obs_threshold
+    _indices = indices
+    _new_indices = new_indices
+    _rw_state_flux = rw_state_flux
+    _rw_bin_probs = rw_bin_probs
+    _eigvals = eigvals
+    _eigvalsi = eigvalsi
+    _eigvals = eigvals
+    _eigvecs = eigvecs
+    _WORK = WORK
+    _graph = graph
+    _visited = visited
+    _rw_color_probs = rw_color_probs
+    _rw_state_probs = rw_state_probs
+    _bin_last_state_map = bin_last_state_map
+    _bin_state_map = bin_state_map
+    _istate = istate
+    _jstate = jstate
+    _return_obs = return_obs
+    #NOGIL
+    # Reconstruct dataset.  We're just passing the same thing back and forth between functions.
+    with nogil:
+        # Fill the member slots of every graph row with the sentinel value
+        # _nfbins, which the solver treats as "no bin here".
+        for i in range(_nfbins):
+            for j in range(1, _nfbins+1):
+                _graph[i, j] = _nfbins
+        regenerate_subsampled_indices(_indices, _new_indices, lind, _stride)
+        # Note that the fluxes are accumulated straight into
+        # _transition_matrix; _total_fluxes is allocated but not filled here.
+        accumulate_fluxes(_rows, _cols, _obs, _flux, _ins, _new_indices, nnz, _transition_matrix, nlind)
+        accumulate_obs(_rows, _cols, _obs, _flux, _ins, _new_indices, nnz, _total_obs, nlind)
+        remove_under_obs(_transition_matrix, _total_obs, _obs_threshold, _nfbins)
+        normalize(_transition_matrix, _nfbins)
+        steadystate_solve(_transition_matrix, _strong_transition_matrix, _rw_bin_probs, _nfbins, _eigvals, _eigvalsi, _eigvecs, _WORK, _graph, _visited)
+        # Fold the per-bin probabilities into the two per-state arrays via
+        # the supplied maps.
+        for i in range(_nfbins):
+            _rw_color_probs[_bin_last_state_map[i]] += _rw_bin_probs[i]
+            _rw_state_probs[_bin_state_map[i]] += _rw_bin_probs[i]
+        calc_state_flux(_transition_matrix, _rw_bin_probs, _bin_last_state_map, _bin_state_map, _nstates, _rw_state_flux, _nfbins)
+    # This allows us to use the same function for all three types.
+    # Return conditional fluxes.
+    if _return_obs == b'F':
+        _return_value = _rw_state_flux[_istate,_jstate]
+        if isnan(_return_value) is True:
+            return 0.0
+        else:
+            return _return_value
+    # Return state probabilities.
+    elif _return_obs == b'S':
+        _return_value = _rw_state_probs[_istate]
+        if isnan(_return_value) is True:
+            return 0.0
+        else:
+            return _return_value
+    # Return color (ensemble) probabilities
+    elif _return_obs == b'C':
+        _return_value = _rw_color_probs[_istate]
+        if isnan(_return_value) is True:
+            return 0.0
+        else:
+            return _return_value
+    # Return the rates.
+    elif _return_obs == b'R':
+        if _rw_color_probs[_istate] != 0.0:
+            # Flux divided by the fraction of (istate + jstate) ensemble
+            # probability that sits in istate.
+            _return_value = (_rw_state_flux[_istate,_jstate] / (_rw_color_probs[_istate] / (_rw_color_probs[_istate] + _rw_color_probs[_jstate])))
+            if isnan(_return_value) is True:
+                return 0.0
+            else:
+                return _return_value
+        else:
+            # We have no ensemble probability, and as such, cannot have a flux.
+            return 0.0
+    # Return the populations.
+    elif _return_obs == b'P':
+        return rw_bin_probs
+@cython.boundscheck(False)
+@cython.wraparound(False)
+@cython.cdivision(True)
+cpdef int regenerate_subsampled_indices(Ushort[:] iin, Ushort[:] iout, int ilen, int stride) nogil:
+    # Expand each of the first ``ilen`` entries of ``iin`` into ``stride``
+    # consecutive values (entry, entry + 1, ...), written back to back into
+    # ``iout``.  ``iout`` must hold at least ilen * stride elements.
+    # Always returns 0.
+    cdef:
+        int src, offset, dst
+    # Running write position; equals src * stride + offset at every store.
+    dst = 0
+    for src in range(ilen):
+        for offset in range(stride):
+            iout[dst] = iin[src] + offset
+            dst += 1
+    return 0
+@cython.boundscheck(False)
+@cython.wraparound(False)
+@cython.cdivision(True)
+cpdef int accumulate_fluxes(int[:] hrows, int[:] hcols, int[:] hobs, weight_t[:] hflux, int[:] hins, Ushort[:] iterations, Py_ssize_t nnz, weight_t[:,:] total_fluxes, int itermax) nogil:
+    # Add sparse flux entries into the dense ``total_fluxes`` matrix, in place.
+    #
+    # For each of the first ``itermax`` entries of ``iterations``, the sparse
+    # entries with positions hins[iiter] .. hins[iiter + 1] - 1 are visited and
+    # hflux[ilem] is added at (hrows[ilem], hcols[ilem]).  ``hobs`` is accepted
+    # but not read here.  Always returns 0.
+    cdef:
+        index_t curriter, elem, iiter, ipop
+        long ilem
+    curriter = 0
+    for iter in range(itermax):
+        iiter = iterations[iter]
+        for ilem in range(hins[iiter], hins[iiter+1]):
+            # Not sure if this is necessary, here...
+            # NOTE(review): the second half of this guard compares an
+            # iteration index (iiter + 1) with the number of entries processed
+            # (itermax); iterations whose index is >= itermax - 1 contribute
+            # nothing.  Confirm that this is intended.
+            if ilem < nnz and iiter+1 < itermax:
+                total_fluxes[hrows[ilem], hcols[ilem]] += hflux[ilem]
+    return 0
+@cython.boundscheck(False)
+@cython.wraparound(False)
+@cython.cdivision(True)
+cpdef int accumulate_obs(int[:] hrows, int[:] hcols, int[:] hobs, weight_t[:] hflux, int[:] hins, Ushort[:] iterations, Py_ssize_t nnz, int[:,:] total_obs, int itermax) nogil:
+    # Add sparse observation counts into the dense ``total_obs`` matrix, in
+    # place.
+    #
+    # For each of the first ``itermax`` entries of ``iterations``, the sparse
+    # entries with positions hins[iiter] .. hins[iiter + 1] - 1 are visited and
+    # hobs[ilem] is added at (hrows[ilem], hcols[ilem]).  ``hflux`` is accepted
+    # but not read here.  Always returns 0.
+    cdef:
+        index_t curriter, elem, iiter, ipop
+        long ilem
+    curriter = 0
+    for iter in range(itermax):
+        iiter = iterations[iter]
+        for ilem in range(hins[iiter], hins[iiter+1]):
+            # NOTE(review): the second half of this guard compares an
+            # iteration index (iiter + 1) with the number of entries processed
+            # (itermax); confirm that this is intended.
+            if ilem < nnz and iiter+1 < itermax:
+                total_obs[hrows[ilem], hcols[ilem]] += hobs[ilem]
+    return 0
+@cython.boundscheck(False)
+@cython.wraparound(False)
+@cython.cdivision(True)
+cpdef int remove_under_obs(weight_t[:,:] flux, int[:,:] obs, int threshold, int nbins) nogil:
+    # Zero, in place, every element of the leading nbins x nbins part of
+    # ``flux`` whose matching count in ``obs`` is below ``threshold``.
+    # Always returns 0.
+    cdef:
+        int x, y
+    for x in range(nbins):
+        for y in range(nbins):
+            if obs[x,y] < threshold:
+                flux[x,y] = 0
+    # Explicit status, matching the other helpers in this module, rather
+    # than falling off the end of a function declared to return int.
+    return 0
+@cython.boundscheck(False)
+@cython.wraparound(False)
+@cython.cdivision(True)
+cpdef int calc_state_flux(weight_t[:, :] trans_matrix, weight_t[:] bin_probs, long[:] bin_last_state_map, Ushort[:] bin_state_map, int nstates, weight_t[:,:] state_flux, int K_shape) nogil:
+    # Add bin-level probability flow, trans_matrix[i, j] * bin_probs[i], into
+    # ``state_flux`` at (bin_last_state_map[i], bin_state_map[j]), in place.
+    # Destination bins mapped to the value ``nstates`` are skipped.
+    # Always returns 0.
+    cdef:
+        int src_bin, dst_bin, src_state, dst_state
+    for src_bin in range(K_shape):
+        # The source state depends only on the outer index.
+        src_state = bin_last_state_map[src_bin]
+        for dst_bin in range(K_shape):
+            dst_state = bin_state_map[dst_bin]
+            if dst_state == nstates:
+                continue
+            state_flux[src_state, dst_state] += (trans_matrix[src_bin, dst_bin] * bin_probs[src_bin])
+    return 0
+@cython.boundscheck(False)
+@cython.wraparound(False)
+@cython.cdivision(True)
+cpdef int steadystate_solve(weight_t[:,:] K, weight_t[:,:] K_mod, weight_t[:] bin_prob, int K_shape, double[:] eigvals, double[:] eigvalsi, double[:,:] eigvecs, double[:,:] WORK, int[:,:] graph, int[:] visited) nogil:
+    # Estimate steady-state bin probabilities of the transition matrix ``K``
+    # and write them into ``bin_prob``.
+    #
+    # Outline:
+    #   1. group bins into connected sets (return_strong_component), recorded
+    #      in ``graph``/``visited``;
+    #   2. pick the set with the most members;
+    #   3. copy the K entries between members of that set into ``K_mod`` and
+    #      row-normalise it;
+    #   4. run LAPACK dgeev on ``K_mod`` and take the eigenvector belonging to
+    #      the largest real eigenvalue part;
+    #   5. normalise that vector over the members of the set.
+    #
+    # All array arguments are caller-allocated work/output buffers and are
+    # modified in place.  ``graph`` member slots are expected to hold the
+    # sentinel value K_shape wherever no bin is stored.  Always returns 0.
+    cdef:
+        int[:] components
+        int[:,:] _graph
+        double max, eigsum
+        int n_components, components_assignments, largest_component, maxi, x, y, n, INFO, LWORK, i, j
+        # POINTERS
+        int  *_INFO, *_K_shape, *_LWORK
+        double *_K_mod, *_eigvals, *_eigvecs, *_WORK, *_eigvalsi
+    # LAPACK takes every argument by pointer, including the scalars.
+    _K_shape = &K_shape
+    _INFO = &INFO
+    _LWORK = &LWORK
+    INFO = 0
+    LWORK = K_shape * 4
+    _K_mod = &K_mod[0,0]
+    _eigvals = &eigvals[0]
+    _eigvecs = &eigvecs[0,0]
+    _eigvalsi = &eigvalsi[0]
+    _WORK = &WORK[0,0]
+    _graph = graph
+    # Start a new set from every bin not yet reached from an earlier one.
+    for i in range(K_shape):
+        if visited[i] == 0:
+            visited[i] = 1
+            return_strong_component(K, K_shape, _graph, i, i, visited)
+    # graph[i, 0] is the member count of the set rooted at i; choose the
+    # largest (the >= comparison makes ties go to the highest index).
+    n = 0
+    for i in range(K_shape):
+        if graph[i, 0] >= graph[n, 0]:
+            n = i
+    # I suspect this may be giving us issues?
+    #components = _graph[n, :K_shape+1]
+    maxi = 0
+    eigsum = 0.0
+    # This all works!
+    # Copy only the entries whose row and column are both members of the
+    # chosen set; K_shape in a member slot means "empty".
+    for x in range(K_shape):
+        #i = components[x+1]
+        i = graph[n, x+1]
+        for y in range(K_shape):
+            #j = components[y+1]
+            j = graph[n, y+1]
+            if i != K_shape and j != K_shape:
+                K_mod[i, j] = K[i, j]
+    normalize(K_mod, K_shape)
+    # dgeev(JOBVL='N', JOBVR='V', N, A, LDA, WR, WI, VL, LDVL, VR, LDVR,
+    #       WORK, LWORK, INFO).  The same buffer is passed for VL and VR; with
+    # JOBVL='N' only the right-eigenvector slot is requested.  INFO is not
+    # inspected afterwards.
+    # NOTE(review): K_mod is a C-ordered buffer handed to a column-major
+    # routine, so LAPACK presumably sees its transpose and the "right"
+    # eigenvectors correspond to left eigenvectors of K_mod; the row-wise
+    # read eigvecs[maxi, x] below would match that layout -- confirm.
+    cl.dgeev('N', 'V', _K_shape, _K_mod, _K_shape, _eigvals, _eigvalsi, _eigvecs, _K_shape, _eigvecs, _K_shape, _WORK, _LWORK, _INFO)
+    # Index of the largest real eigenvalue part (imaginary parts ignored).
+    for x in range(K_shape):
+        if x == 0:
+            max = eigvals[0]
+            maxi = x
+        else:
+            if max < eigvals[x]:
+                max = eigvals[x]
+                maxi = x
+    # We need to go over the whole range and pick out non K_shape elements.
+    # This probably no longer needs to be done, now...
+    for i in range(K_shape):
+        #x = components[i+1]
+        x = graph[n, i+1]
+        if x != K_shape:
+            #eigsum += eigvecs[maxi, components[i+1]]
+            eigsum += eigvecs[maxi, x]
+    # Normalise so the probabilities of the set's members sum to one; bins
+    # outside the set keep whatever value ``bin_prob`` already held.
+    for i in range(K_shape):
+        #x = components[i+1]
+        x = graph[n, i+1]
+        if x != K_shape:
+            #bin_prob[components[i+1]] = eigvecs[maxi, components[i+1]]
+            #bin_prob[components[i+1]] /= eigsum
+            bin_prob[x] = eigvecs[maxi, x]
+            bin_prob[x] /= eigsum
+    return 0
+@cython.boundscheck(False)
+@cython.wraparound(False)
+@cython.cdivision(True)
+cpdef int return_strong_component(weight_t[:,:] K, int K_shape, int[:, :] graph, int i, int z, int[:] visited) nogil:
+    # Depth-first walk over the bins reachable from bin ``i`` through positive
+    # entries of ``K``, recording every newly reached bin in row ``z`` of
+    # ``graph``.
+    #
+    # Layout of graph[z, :]: column 0 is the number of members recorded so
+    # far, columns 1 .. count hold the member bin indices.  ``visited`` is
+    # shared across calls and marks bins already claimed by some row.
+    # Always returns 0.
+    #
+    # NOTE(review): only forward edges K[i, j] > 0 are followed, so this
+    # collects bins reachable from the root rather than verifying mutual
+    # reachability -- confirm that this matches the intended notion of a
+    # "strong" component.
+    cdef:
+        int j, y
+    # First call for this row: register the root bin itself.
+    if graph[z, 0] == 0:
+        graph[z, 0] += 1
+        graph[z, 1] = i
+    for j in xrange(K_shape):
+        if i != j:
+            if K[i, j] > 0.0:
+                # Strongly connected!
+                if visited[j] == 0:
+                    graph[z, 0] += 1
+                    y = graph[z, 0]
+                    graph[z, y] = j
+                    # We only want to call it when we haven't visited it before.
+                    # We don't want to call, THEN modify and check.  Otherwise, we could be doing many calls.
+                    visited[j] = 1
+                    return_strong_component(K, K_shape, graph, j, z, visited)
+    return 0

westpa/core/reweight/matrix.py ADDED Viewed

@@ -0,0 +1,126 @@
+import warnings
+import numpy as np
+import scipy.sparse as sp
+from westpa.core.data_manager import weight_dtype
+from westpa.core import h5io
+# From postanalysis matrix
+from westpa.core.binning import index_dtype
+from westpa.core.reweight import stats_process
+warnings.filterwarnings('ignore', category=DeprecationWarning)
+warnings.filterwarnings('ignore', category=RuntimeWarning)
+warnings.filterwarnings('ignore', category=FutureWarning)
+def calc_stats(bin_assignments, weights, fluxes, populations, trans, mask, sampling_frequency):
+    fluxes.fill(0.0)
+    populations.fill(0.0)
+    trans.fill(0)
+    stats_process(bin_assignments, weights, fluxes, populations, trans, mask, interval=sampling_frequency)
+class FluxMatrix:
+    def w_postanalysis_matrix(self):
+        pi = self.progress.indicator
+        pi.new_operation('Initializing')
+        self.data_reader.open('r')
+        nbins = self.assignments_file.attrs['nbins']
+        state_labels = self.assignments_file['state_labels'][...]
+        # state_map = self.assignments_file['state_map'][...]
+        nstates = len(state_labels)
+        start_iter, stop_iter = self.iter_range.iter_start, self.iter_range.iter_stop  # h5io.get_iter_range(self.assignments_file)
+        iter_count = stop_iter - start_iter
+        nfbins = nbins * nstates
+        flux_shape = (iter_count, nfbins, nfbins)
+        pop_shape = (iter_count, nfbins)
+        h5io.stamp_iter_range(self.output_file, start_iter, stop_iter)
+        bin_populations_ds = self.output_file.create_dataset('bin_populations', shape=pop_shape, dtype=weight_dtype)
+        h5io.stamp_iter_range(bin_populations_ds, start_iter, stop_iter)
+        h5io.label_axes(bin_populations_ds, ['iteration', 'bin'])
+        flux_grp = self.output_file.create_group('iterations')
+        self.output_file.attrs['nrows'] = nfbins
+        self.output_file.attrs['ncols'] = nfbins
+        fluxes = np.empty(flux_shape[1:], weight_dtype)
+        populations = np.empty(pop_shape[1:], weight_dtype)
+        trans = np.empty(flux_shape[1:], np.int64)
+        # Check to make sure this isn't a data set with target states
+        # tstates = self.data_reader.data_manager.get_target_states(0)
+        # if len(tstates) > 0:
+        #    raise ValueError('Postanalysis reweighting analysis does not support WE simulation run under recycling conditions')
+        pi.new_operation('Calculating flux matrices', iter_count)
+        # Calculate instantaneous statistics
+        for iiter, n_iter in enumerate(range(start_iter, stop_iter)):
+            # Get data from the main HDF5 file
+            iter_group = self.data_reader.get_iter_group(n_iter)
+            seg_index = iter_group['seg_index']
+            nsegs, npts = iter_group['pcoord'].shape[0:2]
+            weights = seg_index['weight']
+            # Get bin and traj. ensemble assignments from the previously-generated assignments file
+            assignment_iiter = h5io.get_iteration_entry(self.assignments_file, n_iter)
+            bin_assignments = np.require(
+                self.assignments_file['assignments'][assignment_iiter + np.s_[:nsegs, :npts]], dtype=index_dtype
+            )
+            mask_unknown = np.zeros_like(bin_assignments, dtype=np.uint16)
+            macrostate_iiter = h5io.get_iteration_entry(self.assignments_file, n_iter)
+            macrostate_assignments = np.require(
+                self.assignments_file['trajlabels'][macrostate_iiter + np.s_[:nsegs, :npts]], dtype=index_dtype
+            )
+            # Transform bin_assignments to take macrostate membership into account
+            bin_assignments = nstates * bin_assignments + macrostate_assignments
+            mask_indx = np.where(macrostate_assignments == nstates)
+            mask_unknown[mask_indx] = 1
+            # Calculate bin-to-bin fluxes, bin populations and number of obs transitions
+            calc_stats(bin_assignments, weights, fluxes, populations, trans, mask_unknown, self.sampling_frequency)
+            # Store bin-based kinetics data
+            bin_populations_ds[iiter] = populations
+            # Setup sparse data structures for flux and obs
+            fluxes_sp = sp.coo_matrix(fluxes)
+            trans_sp = sp.coo_matrix(trans)
+            assert fluxes_sp.nnz == trans_sp.nnz
+            flux_iter_grp = flux_grp.create_group('iter_{:08d}'.format(n_iter))
+            flux_iter_grp.create_dataset('flux', data=fluxes_sp.data, dtype=weight_dtype)
+            flux_iter_grp.create_dataset('obs', data=trans_sp.data, dtype=np.int32)
+            flux_iter_grp.create_dataset('rows', data=fluxes_sp.row, dtype=np.int32)
+            flux_iter_grp.create_dataset('cols', data=fluxes_sp.col, dtype=np.int32)
+            flux_iter_grp.attrs['nrows'] = nfbins
+            flux_iter_grp.attrs['ncols'] = nfbins
+            # Do a little manual clean-up to prevent memory explosion
+            del iter_group, weights, bin_assignments
+            del macrostate_assignments
+            pi.progress += 1
+            # Check and save the number of intermediate time points; this will be used to normalize the
+            # flux and kinetics to tau in w_postanalysis_reweight.
+            if self.assignments_file.attrs['subsampled'] is True or self.sampling_frequency == 'iteration':
+                self.output_file.attrs['npts'] = 2
+            else:
+                # self.output_file.attrs['npts'] = npts if self.sampling_frequency == 'timepoint' else 2
+                self.output_file.attrs['npts'] = npts

westpa/core/segment.py ADDED Viewed

@@ -0,0 +1,119 @@
+import math
+import numpy as np
+class Segment:
+    '''A class wrapping segment data that must be passed through the work manager or data manager.
+    Most fields are self-explanatory.  One item worth noting is that a negative parent ID means that
+    the segment starts from the initial state with ID -(segment.parent_id+1)
+    '''
+    SEG_STATUS_UNSET = 0
+    SEG_STATUS_PREPARED = 1
+    SEG_STATUS_COMPLETE = 2
+    SEG_STATUS_FAILED = 3
+    SEG_INITPOINT_UNSET = 0
+    SEG_INITPOINT_CONTINUES = 1
+    SEG_INITPOINT_NEWTRAJ = 2
+    SEG_ENDPOINT_UNSET = 0
+    SEG_ENDPOINT_CONTINUES = 1
+    SEG_ENDPOINT_MERGED = 2
+    SEG_ENDPOINT_RECYCLED = 3
+    statuses = {}
+    initpoint_types = {}
+    endpoint_types = {}
+    status_names = {}
+    initpoint_type_names = {}
+    endpoint_type_names = {}
+    # convenience functions for binning
+    @staticmethod
+    def initial_pcoord(segment):
+        'Return the initial progress coordinate point of this segment.'
+        return segment.pcoord[0]
+    @staticmethod
+    def final_pcoord(segment):
+        'Return the final progress coordinate point of this segment.'
+        return segment.pcoord[-1]
+    def __init__(
+        self,
+        n_iter=None,
+        seg_id=None,
+        weight=None,
+        endpoint_type=None,
+        parent_id=None,
+        wtg_parent_ids=None,
+        pcoord=None,
+        status=None,
+        walltime=None,
+        cputime=None,
+        data=None,
+    ):
+        # NaNs appear sometimes if a WEST program is terminated unexpectedly; replace with zero
+        walltime = 0.0 if walltime is None or math.isnan(walltime) else walltime
+        cputime = 0.0 if cputime is None or math.isnan(cputime) else cputime
+        # the int() and float() calls are required so that new-style string formatting doesn't barf
+        # assuming that the respective fields are actually strings, probably after implicitly
+        # calling __str__() on them.  Not sure if this is a numpy, h5py, or python problem
+        self.n_iter = int(n_iter) if n_iter is not None else None
+        self.seg_id = int(seg_id) if seg_id is not None else None
+        self.status = int(status) if status is not None else None
+        self.parent_id = int(parent_id) if parent_id is not None else None
+        self.endpoint_type = int(endpoint_type) if endpoint_type else self.SEG_ENDPOINT_UNSET
+        self.weight = float(weight) if weight is not None else None
+        self.wtg_parent_ids = set(wtg_parent_ids or ())
+        self.pcoord = np.asarray(pcoord) if pcoord is not None else None
+        self.walltime = walltime
+        self.cputime = cputime
+        self.data = data if data else {}
+    def __repr__(self):
+        return '<%s(%s) n_iter=%r seg_id=%r weight=%r parent_id=%r wtg_parent_ids=%r pcoord[0]=%r pcoord[-1]=%r>' % (
+            self.__class__.__name__,
+            hex(id(self)),
+            self.n_iter,
+            self.seg_id,
+            self.weight,
+            self.parent_id,
+            tuple(self.wtg_parent_ids or ()),
+            self.pcoord[0] if self.pcoord is not None else None,
+            self.pcoord[-1] if self.pcoord is not None else None,
+        )
+    @property
+    def initpoint_type(self):
+        if self.parent_id < 0:
+            return Segment.SEG_INITPOINT_NEWTRAJ
+        else:
+            return Segment.SEG_INITPOINT_CONTINUES
+    @property
+    def initial_state_id(self):
+        if self.parent_id < 0:
+            return -(self.parent_id + 1)
+        else:
+            return None
+    status_text = property((lambda s: s.status_names[s.status]))
+    endpoint_type_text = property((lambda s: s.endpoint_type_names[s.endpoint_type]))
+Segment.statuses.update({_attr: getattr(Segment, _attr) for _attr in dir(Segment) if _attr.startswith('SEG_STATUS_')})
+Segment.initpoint_types.update({_attr: getattr(Segment, _attr) for _attr in dir(Segment) if _attr.startswith('SEG_INITPOINT_')})
+Segment.endpoint_types.update({_attr: getattr(Segment, _attr) for _attr in dir(Segment) if _attr.startswith('SEG_ENDPOINT_')})
+Segment.status_names.update({getattr(Segment, _attr): _attr for _attr in dir(Segment) if _attr.startswith('SEG_STATUS_')})
+Segment.initpoint_type_names.update(
+    {getattr(Segment, _attr): _attr for _attr in dir(Segment) if _attr.startswith('SEG_INITPOINT_')}
+)
+Segment.endpoint_type_names.update({getattr(Segment, _attr): _attr for _attr in dir(Segment) if _attr.startswith('SEG_ENDPOINT_')})