RubyGems - xpflow - Versions diffs - 0.1b → 0.1c - Mend

xpflow 0.1b → 0.1c

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7)

data/bin/xpflow CHANGED Viewed

@@ -47,12 +47,26 @@ def usage
 end
 def use(*args)
-    # TODO: this should be more sophisticated
-    # for now it's so so
+    # obsolete, but backwards compatible 'use'
+    return import(*args)
+end
+def import_via_name(name)
+    # TODO: it should be more sophisticated
+    name = name.to_s
+    begin
+        Kernel.load("./#{name}")
+    rescue LoadError
+        Kernel.require("xpflow/exts/#{name}_use")
+    end
+end
-    args.each do |lib|
-        require "xpflow/exts/#{lib.to_s}_use"
+def import(*args)
+    if args.length == 0
+        raise "Import requires a file or a library"
+    end
+    args.each do |it|
+        import_via_name(it)
     end
 end

data/lib/xpflow/cmdline.rb CHANGED Viewed

@@ -131,12 +131,12 @@ module XPFlow
                     @config[:labels] += labels.split(',').map { |x| x.downcase.to_sym }
                 end
-                opts.on("-I", "--ignore-checkpoints", "Ignore automatically saved checkpoints") do
+                opts.on("-i", "--ignore-checkpoints", "Ignore automatically saved checkpoints") do
                     @config[:ignore_checkpoints] = true
                 end
-                # opts.on("-C", "--checkpoint NAME", "Jump to checkpoint NAME (if exists)") do |name|
-                #     @config[:checkpoint] = name
-                # end
+                opts.on("-c", "--checkpoint NAME", "Jump to checkpoint NAME (if exists)") do |name|
+                    @config[:checkpoint] = name
+                end
                 # opts.on("-c", "--list-checkpoints", "List available checkpoints") do
                 #    @config[:instead] += [ RunInfo.new(:list_checkpoints) ]
                 # end

data/lib/xpflow/data.rb CHANGED Viewed

@@ -48,58 +48,87 @@ module XPFlow
             return average_stddev().last
         end
-        #Credit for cdf_inverse : http://home.online.no/~pjacklam/notes/invnorm/
+        # START OF DISTRIBUTIONS
+        # Credit for cdf_inverse : http://home.online.no/~pjacklam/notes/invnorm/
         # inverse standard normal cumulative distribution function
-        def cdf_inverse(p)
-          a = [0, -3.969683028665376e+01, 2.209460984245205e+02, -2.759285104469687e+02, 1.383577518672690e+02, -3.066479806614716e+01, 2.506628277459239e+00]
-          b = [0, -5.447609879822406e+01, 1.615858368580409e+02, -1.556989798598866e+02, 6.680131188771972e+01, -1.328068155288572e+01]
-          c = [0, -7.784894002430293e-03, -3.223964580411365e-01, -2.400758277161838e+00, -2.549732539343734e+00, 4.374664141464968e+00, 2.938163982698783e+00]
-          d = [0, 7.784695709041462e-03, 3.224671290700398e-01, 2.445134137142996e+00, 3.754408661907416e+00]
-          #Define break-points.
-          p_low  = 0.02425
-          p_high = 1.0 - p_low
-          x = 0.0
-          q = 0.0
-          #Rational approximation for lower region.
-          if 0.0 < p && p < p_low
-            q = Math.sqrt(-2.0*Math.log(p))
-            x = (((((c[1]*q+c[2])*q+c[3])*q+c[4])*q+c[5])*q+c[6]) / ((((d[1]*q+d[2])*q+d[3])*q+d[4])*q+1.0)
-            #Rational approximation for central region.
-          elsif p_low <= p && p <= p_high
-            q = p - 0.5
-            r = q*q
-            x = (((((a[1]*r+a[2])*r+a[3])*r+a[4])*r+a[5])*r+a[6])*q / (((((b[1]*r+b[2])*r+b[3])*r+b[4])*r+b[5])*r+1.0)
-            #Rational approximation for upper region.
-          elsif p_high < p && p < 1.0
-            q = Math.sqrt(-2.0*Math.log(1.0-p))
-            x = -(((((c[1]*q+c[2])*q+c[3])*q+c[4])*q+c[5])*q+c[6]) / ((((d[1]*q+d[2])*q+d[3])*q+d[4])*q+1.0)
-          end
-          #The relative error of the approximation has
-          #absolute value less than 1.15 × 10−9.  One iteration of
-          #Halley’s rational method (third order) gives full machine precision.
-          if 0 < p && p < 1
-            e = 0.5 * Math.erfc(-x/Math.sqrt(2.0)) - p
-            u = e * Math.sqrt(2.0*Math::PI) * Math.exp((x**2.0)/2.0)
-            x = x - u/(1.0 + x*u/2.0)
-          end
-          x
-        end
-        def minimal_sample_prel(prec,confidance)
-          minimal_sample_both(prec,nil,confidance)
-        end
-        def minimal_sample_pabs(prec,confidance)
-          minimal_sample_both(nil,prec,condidance)
-        end
-        #vectors is values and prec and confidence is in percentage
-        def minimal_sample_both(prec_rel,prec,confidence)
-          avg = average
-          prec = prec_rel.nil? ? prec : avg*prec_rel
-          critical_value=cdf_inverse((1-confidence)/2)
-          ((critical_value*stddev() / prec) ** 2).to_i + 1
+        def self.cdf_inverse(p)
+            a = [0, -3.969683028665376e+01, 2.209460984245205e+02, -2.759285104469687e+02, 1.383577518672690e+02, -3.066479806614716e+01, 2.506628277459239e+00]
+            b = [0, -5.447609879822406e+01, 1.615858368580409e+02, -1.556989798598866e+02, 6.680131188771972e+01, -1.328068155288572e+01]
+            c = [0, -7.784894002430293e-03, -3.223964580411365e-01, -2.400758277161838e+00, -2.549732539343734e+00, 4.374664141464968e+00, 2.938163982698783e+00]
+            d = [0, 7.784695709041462e-03, 3.224671290700398e-01, 2.445134137142996e+00, 3.754408661907416e+00]
+            #Define break-points.
+            p_low  = 0.02425
+            p_high = 1.0 - p_low
+            x = 0.0
+            q = 0.0
+            #Rational approximation for lower region.
+            if 0.0 < p && p < p_low
+                q = Math.sqrt(-2.0*Math.log(p))
+                x = (((((c[1]*q+c[2])*q+c[3])*q+c[4])*q+c[5])*q+c[6]) / ((((d[1]*q+d[2])*q+d[3])*q+d[4])*q+1.0)
+                #Rational approximation for central region.
+            elsif p_low <= p && p <= p_high
+                q = p - 0.5
+                r = q*q
+                x = (((((a[1]*r+a[2])*r+a[3])*r+a[4])*r+a[5])*r+a[6])*q / (((((b[1]*r+b[2])*r+b[3])*r+b[4])*r+b[5])*r+1.0)
+                #Rational approximation for upper region.
+            elsif p_high < p && p < 1.0
+                q = Math.sqrt(-2.0*Math.log(1.0-p))
+                x = -(((((c[1]*q+c[2])*q+c[3])*q+c[4])*q+c[5])*q+c[6]) / ((((d[1]*q+d[2])*q+d[3])*q+d[4])*q+1.0)
+            end
+            #The relative error of the approximation has
+            #absolute value less than 1.15 × 10−9.  One iteration of
+            #Halley’s rational method (third order) gives full machine precision.
+            if 0 < p && p < 1
+                e = 0.5 * Math.erfc(-x/Math.sqrt(2.0)) - p
+                u = e * Math.sqrt(2.0*Math::PI) * Math.exp((x**2.0)/2.0)
+                x = x - u/(1.0 + x*u/2.0)
+            end
+            return x
+        end
+        # computes confidence interval, assuming that
+        # the number of measures is large enough
+        # to be approximated with CLT
+        # prec is ABSOLUTE (here and below)
+        def _compute_dist(prec, conf, cvalue)
+            m, s = average_stddev()
+            d = (cvalue * s).to_f / (@values.length ** 0.5)
+            sample = ((cvalue * s / prec) ** 2).to_i + 1
+            return {
+                :interval => [ m - d, m + d ],
+                :d => d,
+                :sample => sample
+            }
+        end
+        def _dist(name, prec, conf)
+            r = case name
+                when :n then _dist_n(prec, conf)
+                when :t then _dist_t(prec, conf)
+                else
+                    raise "Unknown distribution: #{name}"
+                end
+            return r
+        end
+        def _dist_n(prec, conf)
+            cvalue = ValueData.cdf_inverse((1 + conf) * 0.5)
+            return _compute_dist(prec, conf, cvalue)
+        end
+        def confidence_interval_n(conf)
+            return _dist_n(1.0, conf)[:interval]
+        end
+        # computes the minimal sample size
+        def minimal_sample_n(prec, conf)
+            return _dist_n(prec, conf)[:sample]
         end
         TSTUDENT = [
@@ -108,33 +137,31 @@ module XPFlow
             2.074, 2.069, 2.064, 2.060, 2.056, 2.052, 2.048, 2.045, 2.042, 2.021, 2.009,
             2.000, 1.990, 1.984, 1.980, 1.960 ]
-        def confidence_interval
-            if size() >= TSTUDENT.length
-                factor = TSTUDENT[-1]
-            else
-                factor = TSTUDENT[size()]
-            end
-            m, s = average_stddev()
-            d = (factor * s).to_f / (@values.length ** 0.5)
-            return [m - d, m + d]
+        def _get_tstudent_factor
+            n = size()
+            raise "size of sample must be positive" if n <= 0
+            return (n < TSTUDENT.length) ? TSTUDENT[n] : TSTUDENT[-1]
         end
-        def confidence_precision
-            a, b = confidence_interval()
-            return (b - a) * 0.5
+        def _dist_t(prec, conf)
+            cvalue = _get_tstudent_factor()
+            return _compute_dist(prec, conf, cvalue)
         end
-        def confidence_ratio
-            # provides conf. as a percentage around the estimated mean value
-            prec = confidence_precision()
-            mean = average().abs
-            return (prec / mean)
+        # computes confidence interval, assuming that
+        # each measure is normal; therefore their
+        # average is t-student
+        def confidence_interval_t(conf)
+            # TODO: confidence is ignored
+            return _dist_t(1.0, conf)[:interval]
         end
-        def conf_ratio
-            return confidence_ratio
+        def minimal_sample_t(prec, conf)
+            return _dist_t(prec, conf)[:sample]
         end
+        # END OF DISTRIBUTIONS
         def map(&block)
             arr = @values.map(&block)
             return ValueData.new(arr)

data/lib/xpflow/exts/g5k.rb CHANGED Viewed

@@ -204,8 +204,6 @@ module XPFlow; module G5K
         def get_sites
             sites = get_items('sites').list
-            # TODO: temporary fix for two sites
-            sites = sites.select { |x| ! [ "Bordeaux", "Reims" ].include?(x['name']) }
             return sites
         end

data/lib/xpflow/nodes.rb CHANGED Viewed

@@ -458,7 +458,8 @@ module XPFlow
             :bootstrap_taktuk, :simple_node, :node_range, :taktuk_raw, :test_connectivity,
             :nodes_from_file, :nodes_from_result, :distribute, :chain_copy, :ssh_key,
             :nodes_from_machinefile, :g5k_deploy_keys, :localhost, :file_consistency,
-            :ping_localhost, :ping_node, :g5k_reserve_nodes
+            :ping_localhost, :ping_node, :g5k_reserve_nodes,
+            :g5k_sites
         def setup
             nil
@@ -975,21 +976,30 @@ module XPFlow
             return true
         end
-        def g5k_reserve_nodes(*args)
-            p = proxy()
+        def with_g5k_lib(p)
             lib = G5K::Library.new
             lib.logging = proc { |x| p.engine.log(x) }
-            lib.proxy = proxy
-            return lib.reserve_nodes(*args)
+            lib.proxy = p
+            return yield(lib)
+        end
+        def g5k_reserve_nodes(*args)
+            with_g5k_lib(proxy) do |lib|
+                lib.reserve_nodes(*args)
+            end
+        end
+        def g5k_sites(*args)
+            with_g5k_lib(proxy) do |lib|
+                lib.sites()
+            end
         end
         def g5k_get_avail(opts = {})
-            p = proxy()
-            lib = G5K::Library.new
-            lib.logging = proc { |x| p.engine.log(x) }
-            lib.proxy = proxy
-            job = lib.pick_reservation(opts)
-            return job
+            with_g5k_lib(proxy) do |lib|
+                lib.pick_reservation(opts)
+            end
         end
         def nodes_file(user, filepath)

data/lib/xpflow/stdlib.rb CHANGED Viewed

@@ -84,8 +84,9 @@ module XPFlow
             return result
         end
-        def value(v)
-            return v
+        def value(*args)
+            return args.first if args.length == 1
+            return args
         end
         def code(*args)
@@ -249,9 +250,9 @@ module XPFlow
     class DataLibrary < SyncedActivityLibrary
         activities :store, :data, :avg, :sum, :stddev, :gauss,
-            :confidence_precision, :confidence_interval, :save_yaml,
-            :data_vector, :conf_precision, :data_append, :data_push,
-            :run_later, :get_of, :minimal_sample, :minimal_sample_enough
+            :conf_interval, :save_yaml,
+            :data_vector, :data_push,
+            :run_later, :get_of, :minimal_sample, :sample_enough
         def data_vector(values = nil)
             return ValueData.new(values)
@@ -318,10 +319,6 @@ module XPFlow
             return m + s * Math.cos(2*Math::PI*x) * p
         end
-        def data_append(data, x)
-            return data.append(x)
-        end
         def data_push(data, x)
             data.push(x)
         end
@@ -353,13 +350,54 @@ module XPFlow
         def save_yaml(filename, obj)
             IO.write(filename, obj.to_yaml)
         end
-        def minimal_sample_enough(name,opts={})
-          minimal_sample(name,opts)<name.size
+        # opts:
+        #  :dist => distribution type (default: :normal, also: :n, :t, :tstudent)
+        #  :conf => confidence (default: 0.95)
+        #  :rel => relative precision in percents (default: 0.1)
+        #  :abs => absolute precision (e.g., 5)
+        def _parse_sample_opts(v, _opts)
+            opts = { :conf => 0.95, :rel => 0.1, :abs => nil, :dist => :n }.merge(_opts)
+            dists = { :n => :n, :normal => :n, :t => :t, :tstudent => :t }
+            opts[:dist] = dists[opts[:dist]]
+            raise "Wrong confidence" if (opts[:conf] <= 0.0 or opts[:conf] >= 1.0)
+            if opts[:abs].nil?
+                opts[:abs] = v.average() * opts[:rel]
+            end
+            opts[:info] = v._dist(opts[:dist], opts[:abs], opts[:conf])
+            return opts
         end
-        def minimal_sample(name,opts={})
-          opts.merge({:conf=>0.95,:abs=>1})
-          name.minimal_sample_both(opts[:rel],opts[:abs],opts[:conf])
+        def flatten_data(x)
+            if x.is_a?(Array)
+                return ValueData.new(x)
+            elsif x.is_a?(ValueData)
+                return x
+            else
+                raise "Wrong data type: #{x.class}"
+            end
         end
+        def sample_enough(v, opts = {})
+            v = flatten_data(v)
+            opts = _parse_sample_opts(v, opts)
+            info = opts[:info]
+            return info[:d] <= opts[:abs]
+        end
+        def minimal_sample(v, opts = {})
+            v = flatten_data(v)
+            opts = _parse_sample_opts(v, opts)
+            return opts[:info][:sample]
+        end
+        def conf_interval(v, opts = {})
+            v = flatten_data(v)
+            opts = _parse_sample_opts(v, opts)
+            return opts[:info][:interval]
+        end
     end
     class TestLibrary < SyncedActivityLibrary

metadata CHANGED Viewed

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: xpflow
 version: !ruby/object:Gem::Version
-  version: 0.1b
+  version: 0.1c
   prerelease: 3
 platform: ruby
 authors: