RubyGems - CooCoo - Versions diffs - 0.1.0 - Mend

CooCoo 0.1.0

Files changed (105) hide show

checksums.yaml +7 -0
data/.gitignore +16 -0
data/CooCoo.gemspec +47 -0
data/Gemfile +4 -0
data/Gemfile.lock +88 -0
data/README.md +123 -0
data/Rakefile +81 -0
data/bin/cuda-dev-info +25 -0
data/bin/cuda-free +28 -0
data/bin/cuda-free-trend +7 -0
data/bin/ffi-gen +267 -0
data/bin/spec_runner_html.sh +42 -0
data/bin/trainer +198 -0
data/bin/trend-cost +13 -0
data/examples/char-rnn.rb +405 -0
data/examples/cifar/cifar.rb +94 -0
data/examples/img-similarity.rb +201 -0
data/examples/math_ops.rb +57 -0
data/examples/mnist.rb +365 -0
data/examples/mnist_classifier.rb +293 -0
data/examples/mnist_dream.rb +214 -0
data/examples/seeds.rb +268 -0
data/examples/seeds_dataset.txt +210 -0
data/examples/t10k-images-idx3-ubyte +0 -0
data/examples/t10k-labels-idx1-ubyte +0 -0
data/examples/train-images-idx3-ubyte +0 -0
data/examples/train-labels-idx1-ubyte +0 -0
data/ext/buffer/Rakefile +50 -0
data/ext/buffer/buffer.pre.cu +727 -0
data/ext/buffer/matrix.pre.cu +49 -0
data/lib/CooCoo.rb +1 -0
data/lib/coo-coo.rb +18 -0
data/lib/coo-coo/activation_functions.rb +344 -0
data/lib/coo-coo/consts.rb +5 -0
data/lib/coo-coo/convolution.rb +298 -0
data/lib/coo-coo/core_ext.rb +75 -0
data/lib/coo-coo/cost_functions.rb +91 -0
data/lib/coo-coo/cuda.rb +116 -0
data/lib/coo-coo/cuda/device_buffer.rb +240 -0
data/lib/coo-coo/cuda/device_buffer/ffi.rb +109 -0
data/lib/coo-coo/cuda/error.rb +51 -0
data/lib/coo-coo/cuda/host_buffer.rb +117 -0
data/lib/coo-coo/cuda/runtime.rb +157 -0
data/lib/coo-coo/cuda/vector.rb +315 -0
data/lib/coo-coo/data_sources.rb +2 -0
data/lib/coo-coo/data_sources/xournal.rb +25 -0
data/lib/coo-coo/data_sources/xournal/bitmap_stream.rb +197 -0
data/lib/coo-coo/data_sources/xournal/document.rb +377 -0
data/lib/coo-coo/data_sources/xournal/loader.rb +144 -0
data/lib/coo-coo/data_sources/xournal/renderer.rb +101 -0
data/lib/coo-coo/data_sources/xournal/saver.rb +99 -0
data/lib/coo-coo/data_sources/xournal/training_document.rb +78 -0
data/lib/coo-coo/data_sources/xournal/training_document/constants.rb +15 -0
data/lib/coo-coo/data_sources/xournal/training_document/document_maker.rb +89 -0
data/lib/coo-coo/data_sources/xournal/training_document/document_reader.rb +105 -0
data/lib/coo-coo/data_sources/xournal/training_document/example.rb +37 -0
data/lib/coo-coo/data_sources/xournal/training_document/sets.rb +76 -0
data/lib/coo-coo/debug.rb +8 -0
data/lib/coo-coo/dot.rb +129 -0
data/lib/coo-coo/drawing.rb +4 -0
data/lib/coo-coo/drawing/cairo_canvas.rb +100 -0
data/lib/coo-coo/drawing/canvas.rb +68 -0
data/lib/coo-coo/drawing/chunky_canvas.rb +101 -0
data/lib/coo-coo/drawing/sixel.rb +214 -0
data/lib/coo-coo/enum.rb +17 -0
data/lib/coo-coo/from_name.rb +58 -0
data/lib/coo-coo/fully_connected_layer.rb +205 -0
data/lib/coo-coo/generation_script.rb +38 -0
data/lib/coo-coo/grapher.rb +140 -0
data/lib/coo-coo/image.rb +286 -0
data/lib/coo-coo/layer.rb +67 -0
data/lib/coo-coo/layer_factory.rb +26 -0
data/lib/coo-coo/linear_layer.rb +59 -0
data/lib/coo-coo/math.rb +607 -0
data/lib/coo-coo/math/abstract_vector.rb +121 -0
data/lib/coo-coo/math/functions.rb +39 -0
data/lib/coo-coo/math/interpolation.rb +7 -0
data/lib/coo-coo/network.rb +264 -0
data/lib/coo-coo/neuron.rb +112 -0
data/lib/coo-coo/neuron_layer.rb +168 -0
data/lib/coo-coo/option_parser.rb +18 -0
data/lib/coo-coo/platform.rb +17 -0
data/lib/coo-coo/progress_bar.rb +11 -0
data/lib/coo-coo/recurrence/backend.rb +99 -0
data/lib/coo-coo/recurrence/frontend.rb +101 -0
data/lib/coo-coo/sequence.rb +187 -0
data/lib/coo-coo/shell.rb +2 -0
data/lib/coo-coo/temporal_network.rb +291 -0
data/lib/coo-coo/trainer.rb +21 -0
data/lib/coo-coo/trainer/base.rb +67 -0
data/lib/coo-coo/trainer/batch.rb +82 -0
data/lib/coo-coo/trainer/batch_stats.rb +27 -0
data/lib/coo-coo/trainer/momentum_stochastic.rb +59 -0
data/lib/coo-coo/trainer/stochastic.rb +47 -0
data/lib/coo-coo/transformer.rb +272 -0
data/lib/coo-coo/vector_layer.rb +194 -0
data/lib/coo-coo/version.rb +3 -0
data/lib/coo-coo/weight_deltas.rb +23 -0
data/prototypes/convolution.rb +116 -0
data/prototypes/linear_drop.rb +51 -0
data/prototypes/recurrent_layers.rb +79 -0
data/www/images/screamer.png +0 -0
data/www/images/screamer.xcf +0 -0
data/www/index.html +82 -0
metadata +373 -0

@@ -0,0 +1,293 @@
+#!/bin/env ruby
+require 'fileutils'
+require 'mnist'
+require 'ostruct'
+require 'coo-coo'
+require 'coo-coo/image'
+require 'coo-coo/convolution'
+require 'coo-coo/neuron_layer'
+require 'coo-coo/subnet'
+require 'coo-coo/drawing/sixel'
+require 'colorize'
+def backup(path)
+  if File.exists?(path)
+    backup = path.to_s + "~"
+    if File.exists?(backup)
+      File.delete(backup)
+    end
+    FileUtils.copy(path, backup)
+  end
+end
+options = OpenStruct.new
+options.examples = 0
+options.epochs = 1
+options.num_tests = 10
+options.start_tests_at = 0
+options.rotations = 8
+options.max_rotation = 90.0
+options.num_translations = 1
+options.translate_dx = 0
+options.translate_dy = 0
+options.hidden_layers = nil
+options.hidden_size = 128
+options.activation_function = CooCoo.default_activation
+options.trainer = 'Stochastic'
+options.softmax = false
+options.convolution = nil
+options.conv_step = 8
+options.stacked_convolution = false
+options.test_images_path = MNist::TEST_IMAGES_PATH
+options.test_labels_path = MNist::TEST_LABELS_PATH
+opts = CooCoo::OptionParser.new do |o|
+  o.on('-h', '--help') do
+    puts(o)
+    if options.trainer
+      t = CooCoo::Trainer.from_name(options.trainer)
+      raise NameError.new("Unknown trainer #{options.trainer}") unless t
+      opts, _ = t.options
+      puts(opts)
+    end
+    exit
+  end
+  o.on('--sixel') do
+    options.sixel = true
+  end
+  o.on('-m', '--model PATH') do |path|
+    options.model_path = Pathname.new(path)
+    options.binary_blob = File.extname(options.model_path) == '.bin'
+  end
+  o.on('--binary') do
+    options.binary_blob = true
+  end
+  o.on('-t', '--train NUMBER', 'train for number of epochs') do |n|
+    options.train = true
+    options.epochs = n.to_i
+  end
+  o.on('-e', '--examples NUMBER') do |n|
+    options.examples = n.to_i
+  end
+  o.on('-p', '--predict NUMBER') do |n|
+    options.num_tests = n.to_i
+  end
+  o.on('-s', '--skip NUMBER') do |n|
+    options.start_tests_at = n.to_i
+  end
+  o.on('-r', '--rotations NUMBER') do |n|
+    options.rotations = n.to_i
+  end
+  o.on('-a', '--angle NUMBER') do |n|
+    options.max_rotation = n.to_f
+  end
+  o.on('--num-translations NUMBER') do |n|
+    options.num_translations = n.to_i
+  end
+  o.on('--delta-x NUMBER') do |dx|
+    options.translate_dx = dx.to_f
+  end
+  o.on('--delta-y NUMBER') do |dy|
+    options.translate_dy = dy.to_f
+  end
+  o.on('-l', '--hidden-layers NUMBER') do |n|
+    options.hidden_layers = n.to_i
+  end
+  o.on('--hidden-size NUMBER') do |n|
+    options.hidden_size = n.to_i
+  end
+  o.on('-f', '--activation-func FUNC') do |func|
+    options.activation_function = CooCoo::ActivationFunctions.from_name(func)
+  end
+  o.on('--trainer NAME') do |name|
+    options.trainer = name
+  end
+  o.on('--softmax') do
+    options.softmax = true
+  end
+  o.on('--convolution') do
+    options.convolution = true
+  end
+  o.on('--convolution-step NUMBER') do |n|
+    n = n.to_i
+    raise ArgumentError.new("The convolution step must be >0.") if n <= 0
+    options.conv_step = n
+  end
+end
+argv = opts.parse!(ARGV)
+max_rad = options.max_rotation.to_f * Math::PI / 180.0
+trainer = nil
+trainer_options = nil
+if options.trainer
+  trainer = CooCoo::Trainer.from_name(options.trainer)
+  raise NameError.new("Unknown trainer #{options.trainer}") unless trainer
+  t_opts, trainer_options = trainer.options
+  argv = t_opts.parse!(argv)
+end
+raise ArgumentError.new("The convolution step must be >=8 when stacking convolutions.") if options.conv_step < 8
+puts("Loading MNist data")
+data = MNist::DataStream.new
+net = CooCoo::Network.new
+if options.model_path && File.exists?(options.model_path)
+  puts("Loading #{options.model_path}")
+  if options.binary_blob
+    net = Marshal.load(File.read(options.model_path))
+  else
+    net.load!(options.model_path)
+  end
+else
+  area = data.width * data.height
+  if options.convolution
+    l = CooCoo::Convolution::BoxLayer.new(data.width, data.height, options.conv_step, options.conv_step, CooCoo::Layer.new(16, 4, options.activation_function), 4, 4, 2, 2)
+    net.layer(l)
+    area = l.size
+  end
+  # net.layer(CooCoo::Layer.new(area, 50, options.activation_function))
+  # net.layer(CooCoo::Layer.new(50, 20, , options.activation_function))
+  # net.layer(CooCoo::Layer.new(20, 10, options.activation_function))
+  #net.layer(CooCoo::Layer.new(area, 10, options.activation_function))
+  if options.hidden_layers
+    net.layer(CooCoo::Layer.new(area, options.hidden_size, options.activation_function))
+    if options.hidden_layers > 2
+      (options.hidden_layers - 2).times do
+        net.layer(CooCoo::Layer.new(options.hidden_size, options.hidden_size, options.activation_function))
+      end
+    end
+    net.layer(CooCoo::Layer.new(options.hidden_size, 10, options.activation_function))
+  else
+    net.layer(CooCoo::Layer.new(area, area / 4, options.activation_function))
+    net.layer(CooCoo::Layer.new(area / 4, 10, options.activation_function))
+  end
+  #net.layer(CooCoo::Convolution::BoxLayer.new(7, 7, CooCoo::Layer.new(16, 4), 4, 4, 2, 2))
+  #net.layer(CooCoo::Layer.new(14 * 14, 10))
+  if options.softmax
+    net.layer(CooCoo::LinearLayer.new(10, CooCoo::ActivationFunctions::ShiftedSoftMax.instance))
+  end
+end
+puts("Net ready:")
+puts("\tAge: #{net.age}")
+puts("\tActivation: #{net.activation_function}")
+puts("\tInputs: #{net.num_inputs}")
+puts("\tOutputs: #{net.num_outputs}")
+puts("\tLayers: #{net.num_layers}")
+net.layers.each_with_index do |l, i|
+  puts("\t\t#{i}\t#{l.num_inputs}\t#{l.size}\t#{l.class}")
+end
+$stdout.flush
+if options.train
+  if options.model_path
+    backup(options.model_path)
+  end
+  data_r = MNist::DataStream::Rotator.new(data, options.rotations, max_rad, false)
+  data_t = MNist::DataStream::Translator.new(data_r, options.num_translations, options.translate_dx, options.translate_dy, false)
+  training_set = MNist::TrainingSet.new(data_t).each
+  ts = training_set.each
+  if options.examples > 0
+    ts = ts.first(options.examples * options.rotations)
+  end
+  if options.epochs > 1
+    ts = ts.cycle(options.epochs)
+  end
+  nex = options.examples * options.rotations * options.num_translations
+  nex = "all" if nex == 0
+  puts("Training #{nex} examples in #{trainer_options.batch_size} sized batches at a rate of #{trainer_options.learning_rate} with #{trainer.name}.")
+  trainer.train({ network: net,
+                  data: ts
+                }.merge(trainer_options.to_h)) do |stats|
+    avg_err = stats.average_loss
+    raise "Cost went to NAN" if avg_err.nan?
+    puts("Cost\t#{avg_err.average}")
+    puts("  Magnitude\t#{avg_err.magnitude}")
+    if options.model_path
+      puts("Batch #{stats.batch} took #{stats.total_time} seconds")
+      puts("Saving to #{options.model_path}")
+      if options.binary_blob
+        File.open(options.model_path, 'wb') do |f|
+          f.write(Marshal.dump(net))
+        end
+      else
+        net.save(options.model_path)
+      end
+    end
+    $stdout.flush
+  end
+end
+CHECKMARK = "\u2714"
+CROSSMARK = "\u2718"
+puts("Trying the training images")
+errors = Array.new(options.num_tests, 0)
+data = MNist::DataStream.new(options.test_labels_path, options.test_images_path)
+data_r = MNist::DataStream::Rotator.new(data.each.
+                                          drop(options.start_tests_at).
+                                          first(options.num_tests),
+                                        1, max_rad, true)
+data_t = MNist::DataStream::Translator.new(data_r, 1, options.translate_dx, options.translate_dy, true)
+data_t.
+  each_with_index do |example, i|
+  output, hidden_state = net.predict(CooCoo::Vector[example.pixels, data.width * data.height, 0] / 256.0, Hash.new, true)
+  max_outputs = output.each_with_index.sort.reverse
+  max_output = max_outputs.first[1]
+  passed = example.label == max_output
+  color = passed ? :green : :red
+  mark = passed ? CHECKMARK : CROSSMARK
+  errors[i] = 1.0 unless passed
+  sixel = if options.sixel
+            " for " + CooCoo::Drawing::Sixel.to_string do |s|
+      16.times { |i| c = i / 16.0 * 100; s.set_color(i, c, c, c) }
+      s.from_array(CooCoo::Vector[example.each_pixel.collect.to_a] * 16.0 / 256.0, 28, 28)
+    end
+          else
+            "\n"
+          end
+  puts("#{mark.send(color)} #{i.to_s.send(color)}\tExpecting: #{example.label}#{sixel}\tAngle: #{example.angle * 180.0 / Math::PI}\n\tOffset: #{example.offset_x} #{example.offset_y}\n\tGot: #{max_output}\t#{max_output == example.label}\n\tOutputs: #{output}\n\tBest guesses: #{max_outputs.first(3).inspect}")
+  if example.label != max_output
+    puts("#{example.to_ascii}")
+  end
+end
+puts("Errors: #{errors.each.sum / options.num_tests.to_f * 100.0}% (#{errors.each.sum}/#{options.num_tests})")

data/examples/mnist_dream.rb ADDED

@@ -0,0 +1,214 @@
+require 'coo-coo'
+require 'ostruct'
+require 'coo-coo/drawing/sixel'
+require 'colorize'
+# Global switch for colouring the ASCII rendering; the --color flag overwrites it.
+$use_color = true
+# Characters for the ASCII rendering, indexed by scaled pixel intensity.
+# Frozen so the shared lookup table cannot be mutated by accident.
+PixelValues = ' -+%X#'.freeze
+# Colour names passed to colorize, indexed the same way as PixelValues.
+ColorValues = %i[black red green blue magenta white].freeze
+def char_for_pixel(p)
+  PixelValues[(p * (PixelValues.length - 1)).to_i] || PixelValues[0]
+end
+def color_for_pixel(p)
+  ColorValues[(p * (ColorValues.length - 1)).to_i] || ColorValues[0]
+end
+def output_to_ascii(output)
+  output = output.minmax_normalize(true)
+  s = ""
+  w = Math.sqrt(output.size).to_i
+  w.times do |y|
+    w.times do |x|
+      v = output[x + y * w]
+      v = 1.0 if v > 1.0
+      v = 0.0 if v < 0.0
+      c = char_for_pixel(v)
+      c = c.colorize(color_for_pixel(v)) if $use_color
+      s += c
+    end
+    s += "\n"
+  end
+  s
+end
+def output_to_sixel(output)
+  output = output.minmax_normalize(true)
+  CooCoo::Drawing::Sixel.to_string do |s|
+    16.times { |i| c = i / 16.0 * 100; s.set_color(i, c, c, c) }
+    w = Math.sqrt(output.size).to_i
+    s.from_array(output * 16, w, w)
+  end
+end
+def sgd(opts)
+  f = opts.fetch(:f)
+  cost = opts.fetch(:cost)
+  loss = opts.fetch(:loss)
+  update = opts.fetch(:update)
+  #on_batch = opts.fetch(:on_batch)
+  status = opts.fetch(:status)
+  epochs = opts.fetch(:epochs, 1)
+  rate = opts.fetch(:rate)
+  verbose = opts.fetch(:verbose, false)
+  status_time = opts.fetch(:status_time, Float::INFINITY)
+  last_time = Time.now
+  last_deltas = 0.0 # CooCoo::Vector.zeros(28 * 28)
+  c = nil
+  output = nil
+  deltas = nil
+  epochs.times do |e|
+    output = f.call()
+    c = cost.call(*output)
+    deltas = loss.call(c, *output) * rate
+    update.call(deltas, last_deltas * rate)
+    last_deltas = deltas
+    dt = Time.now - last_time
+    if status && verbose && dt > status_time
+      status.call({ dt: dt,
+                    epoch: e,
+                    output: output,
+                    cost: c,
+                    deltas: deltas
+                  })
+      last_time = Time.now
+    end
+  end
+  if status && verbose
+    status.call({ dt: Time.now - last_time,
+                  epoch: epochs,
+                  output: output,
+                  cost: c,
+                  deltas: deltas
+                })
+  end
+end
+def backprop_digit(loops, rate, net, digit, initial_input = nil, verbose = false, status_delay = 5.0, to_ascii = true, to_sixel = false)
+  initial_input ||= CooCoo::Vector.zeros(net.num_inputs)
+  input = initial_input
+  target = CooCoo::Vector.zeros(net.num_outputs)
+  target[digit % net.num_outputs] = 1.0
+  target = net.prep_output_target(target)
+  sgd(epochs: loops, rate: rate, status_time: status_delay, verbose: verbose,
+      f: lambda do
+        output, hs = net.forward(input, {}, true, true)
+      end,
+      cost: lambda do |output, hs|
+        output.last - target
+      end,
+      loss: lambda do |c, output, hs|
+        deltas, hs = net.backprop(input, output, c, hs)
+        errs = net.transfer_errors(deltas)
+        x = errs.first
+      end,
+      update: lambda do |deltas, last_deltas|
+        input = input - deltas + last_deltas
+      end,
+      status: lambda do |opts|
+        puts("#{opts[:epoch]} #{digit} Input")
+        puts(output_to_sixel(input)) if to_sixel
+        puts(output_to_ascii(input)) if to_ascii
+        puts("Output: #{opts[:output][0].last[digit]}\t#{opts[:output][0].last}\n")
+        puts("Cost: #{opts[:cost].magnitude}\t#{opts[:cost]}\n")
+        puts
+      end)
+  input
+end
+options = OpenStruct.new
+options.model_path = nil
+options.loops = 10
+options.rate = 0.5
+options.initial_input = CooCoo::Vector.zeros(28 * 28)
+options.status_delay = 5.0
+options.ascii = true
+options.sixel = false
+opts = CooCoo::OptionParser.new do |o|
+  o.on('--print-values BOOL') do |bool|
+    options.print_values = bool =~ /(1|t(rue)?|f(false)?|y(es)?)/
+  end
+  o.on('--sixel', "toggles on the display of the dream as a Sixel graphic") do
+    options.sixel = !options.sixel
+  end
+  o.on('--ascii', "toggles off the display of the dream as ASCII") do
+    options.ascii = !options.ascii
+  end
+  o.on('--color BOOL', 'toggles the use of color in the ASCII dream') do |bool|
+    $use_color = bool =~ /(1|t(rue)?|f(false)?|y(es)?)/
+  end
+  o.on('-m', '--model PATH') do |path|
+    options.model_path = Pathname.new(path)
+  end
+  o.on('-l', '--loops NUMBER') do |n|
+    options.loops = n.to_i
+  end
+  o.on('-r', '--rate NUMBER') do |n|
+    options.rate = n.to_f
+  end
+  o.on('-v', '--verbose') do
+    options.verbose = true
+  end
+  o.on('--status-delay SECONDS') do |n|
+    options.status_delay = n.to_f
+  end
+  o.on('-i', '--initial NAME') do |n|
+    options.initial_input = case n[0].downcase
+                            when 'o' then CooCoo::Vector.ones(28 * 28)
+                            when 'r' then CooCoo::Vector.rand(28 * 28)
+                            when 'z' then CooCoo::Vector.zeros(28 * 28)
+                            when 'h' then CooCoo::Vector.new(28 * 28, 0.5)
+                            else raise ArgumentError.new("Unknown initial value #{n}")
+                            end
+  end
+end
+argv = opts.parse!(ARGV)
+net = if File.extname(options.model_path) == '.bin'
+        Marshal.load(File.read(options.model_path))
+      else
+        CooCoo::Network.load(options.model_path)
+      end
+argv = 10.times if argv.empty?
+argv.collect do |digit|
+  digit = digit.to_i
+  $stdout.puts("Generating #{digit}") if options.verbose
+  input = backprop_digit(options.loops, options.rate, net, digit.to_i, options.initial_input, options.verbose, options.status_delay, options.ascii, options.sixel)
+  $stdout.flush
+  [ digit, input ]
+end.each do |digit, input|
+  output, hs = net.predict(input, {})
+  passed = output[digit] > 0.8
+  color = passed ? :green : :red
+  status_char = passed ? "\u2714" : "\u2718"
+  puts("#{digit}".colorize(color))
+  puts('=' * 8)
+  puts
+  puts(output_to_sixel(input)) if options.sixel
+  puts(output_to_ascii(input)) if options.ascii
+  puts(input) if options.print_values
+  puts
+  puts("#{status_char.colorize(color)} Output #{output[digit]} #{output.magnitude} #{options.verbose ? output.inspect : ''}")
+  puts
+end