RubyGems - csv_madness - Versions diffs - 0.0.3 → 0.0.4 - Mend

csv_madness 0.0.3 → 0.0.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

data/CHANGELOG.markdown ADDED Viewed

@@ -0,0 +1,17 @@
+0.0.4
+=====
+* Fixed serious bug for default column names.  record.middle_name instead of record.middlename
+* Spreadsheet can be re-read from file by calling @sheet.reload_spreadsheet(opts)
+0.0.3
+=====
+* Feature:  can add and drop columns from spreadsheets
+0.0.2
+=====
+* Aw, hell.  I don't remember.

data/Gemfile CHANGED Viewed

@@ -5,6 +5,9 @@ source "http://rubygems.org"
 # Add dependencies to develop your gem here.
 # Include everything needed to run rake, tests, features, etc.
+gem "fun_with_files"
 group :development do
   gem "shoulda", ">= 0"
   gem "rdoc", "~> 3.12"

data/README.rdoc CHANGED Viewed

@@ -121,9 +121,9 @@ sheet.write_to_file( "~/data/people.clean.csv", force_quotes: true ) # save the
 You could do something similar to clean and standardize phone numbers, detect and delete/complete invalid emails, etc.
-=== Adding and removing columns
+=== Adding, removing, and renaming columns ===
-# Add 72 years to the date born.
+# Add 72 years to the date born.
 sheet.set_column_type( :born, :date )  # replace date strings with Time objects
 sheet.add_column( :expected_death_date ) do |date, record|
@@ -135,8 +135,10 @@ puts sheet[0].expected_death_date     # should be in 2058
 # But that's just morbid, so we drop the column
 sheet.drop_column( :expected_death_date )
+# Or, if you think you need the information, but need to be a bit more euphemistic about it
+sheet.rename_column( :expected_death_date, :expiration_date )
-=== Using columns
+=== Using columns ===
 sheet.set_column_type( :id, :integer )

data/Rakefile CHANGED Viewed

@@ -33,9 +33,11 @@ Jeweler::Tasks.new do |gem|
                 "./VERSION",
                 "./README.rdoc",
                 "./Rakefile",
+                "./CHANGELOG.markdown",
                 "./test/csv/simple.csv",
                 "./test/helper.rb",
-                "./test/test_csv_madness.rb" ]
+                "./test/test_csv_madness.rb",
+                "./test/test_sheet.rb" ]
 end
 Jeweler::RubygemsDotOrgTasks.new

data/VERSION CHANGED Viewed

@@ -1 +1 @@
-0.0.3
+0.0.4

data/lib/csv_madness/record.rb CHANGED Viewed

@@ -13,11 +13,21 @@ module CsvMadness
     end
     def [] key
-      @csv_data[key]
+      case key
+      when String, Integer
+        @csv_data[key]
+      when Symbol
+        @csv_data[key.to_s]
+      end
     end
     def []= key, val
-      @csv_data[key] = val
+      case key
+      when String, Integer
+        @csv_data[key] = val
+      when Symbol
+        @csv_data[key.to_s] = val
+      end
     end
     def columns
@@ -37,7 +47,7 @@ module CsvMadness
     end
     def blank?( col )
-      (self.send( col ).to_s || "").strip.length == 0
+      (self.send( col.to_sym ).to_s || "").strip.length == 0
     end
   end
 end

data/lib/csv_madness/sheet.rb CHANGED Viewed

@@ -30,7 +30,8 @@ module CsvMadness
     # Used to make getter/setter names out of the original header strings.
     # " hello;: world! " => :hello_world
     def self.getter_name( name )
-      name = name.strip.gsub(/\s+/,"_").gsub(/(\W|_)+/, "" ).downcase
+      name = name.strip.gsub( /\s+/, "_" ).gsub( /(\W|_)+/, "_" ).downcase
+      name = name.gsub( /_+$/, "" )
       if name.match( /^\d/ )
         name = "_#{name}"
       end
@@ -43,9 +44,17 @@ module CsvMadness
     def self.add_search_path( path )
       @search_paths ||= []
       path = Pathname.new( path ).expand_path
+      unless path.directory?
+        raise "The given path does not exist"
+      end
       @search_paths << path unless @search_paths.include?( path )
     end
+    def self.search_paths
+      @search_paths
+    end
     def self.from( csv_file, opts = {} )
       if f = find_spreadsheet_in_filesystem( csv_file )
         Sheet.new( f, opts )
@@ -83,7 +92,7 @@ module CsvMadness
     end
     def self.write_to_file( spreadsheet, file, opts = {} )
-      file = Pathname.new(file).expand_path
+      file = file.fwf_filepath.expand_path
       File.open( file, "w" ) do |f|
         f << spreadsheet.to_csv( opts )
       end
@@ -99,7 +108,7 @@ module CsvMadness
       end
     end
-    attr_reader :columns, :records, :spreadsheet_file, :record_class
+    attr_reader :columns, :index_columns, :records, :spreadsheet_file, :record_class
     # opts:
     #   index: ( [:id, :id2 ] )
     #       columns you want mapped for quick
@@ -115,28 +124,37 @@ module CsvMadness
     #   header:   false
     #       anything else, we assume the csv file has a header row
     def initialize( spreadsheet, opts = {} )
-      @spreadsheet_file = self.class.find_spreadsheet_in_filesystem( spreadsheet )
+      if spreadsheet.is_a?(Array)
+        @spreadsheet_file = nil
+      else
+        @spreadsheet_file = self.class.find_spreadsheet_in_filesystem( spreadsheet )
+      end
       @opts = opts
       @opts[:header] = (@opts[:header] == false ? false : true)  # true unless already explicitly set to false
+      reload_spreadsheet
+    end
+    def reload_spreadsheet( opts = @opts )
       load_csv
-      set_initial_columns( @opts[:columns] )
+      set_initial_columns( opts[:columns] )
       create_record_class
       package
-      @index_columns = case @opts[:index]
+      set_index_columns( opts[:index] )
+      reindex
+    end
+    def set_index_columns( index_columns )
+      @index_columns = case index_columns
       when NilClass
         []
       when Symbol
-        [ @opts[:index] ]
+        [ index_columns ]
       when Array
-        @opts[:index]
+        index_columns
       end
-      reindex
     end
     def [] offset
@@ -196,8 +214,9 @@ module CsvMadness
       end
     end
-    # if column doesn't exist, silently fails.  Proper behavior?  Dunno.
     def alter_column( column, blank = :undefined, &block )
+      raise "Column does not exist: #{column}" unless @columns.include?( column )
       if cindex = @columns.index( column )
         for record in @records
           if record.blank?(column) && blank != :undefined
@@ -209,8 +228,9 @@ module CsvMadness
       end
     end
+    # If no block given, adds an empty column
     def add_column( column, &block )
-      raise "Column already exists" if @columns.include?( column )
+      raise "Column already exists: #{column}" if @columns.include?( column )
       @columns << column
       # add empty column to each row
@@ -241,10 +261,45 @@ module CsvMadness
       update_data_accessor_module
     end
+    def rename_column( column, new_name )
+      @columns[@columns.index(column)] = new_name
+      rename_index_column( column, new_name ) if @index_columns.include?( column )
+      update_data_accessor_module
+    end
     def set_column_type( column, type, blank = :undefined )
       alter_column( column, blank, &COLUMN_TYPES[type] )
     end
+    # If :reverse_merge is true, then the dest column is only overwritten for records where :dest is blank
+    def merge_columns( source, dest, opts = {} )
+      opts = { :drop_source => true, :reverse_merge => false, :default => "" }.merge( opts )
+      column_must_exist( source, dest )
+      self.records.each do |record|
+        if opts[:reverse_merge] == false || record.blank?( dest )
+          record[dest] = record.blank?(source) ? opts[:default] : record[source]
+        end
+      end
+      self.drop_column( source ) if opts[:drop_source]
+    end
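+    # By default, the two columns are joined with no separator and the result is written to col1 (override with opts[:separator] and opts[:out]).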
+    def concat_columns( col1, col2, opts = {} )
+      opts =  {:separator => '', :out => col1}.merge( opts )
+      column_must_exist( col1, col2 )
+      self.add_column( opts[:out] ) unless self.columns.include?( opts[:out] )
+      for record in self.records
+        record[ opts[:out] ] = "#{record[col1]}#{opts[:separator]}#{record[col2]}"
+      end
+    end
+    alias :concatenate :concat_columns
     # Note: If a block is given, the mod arg will be ignored.
     def add_record_methods( mod = nil, &block )
       if block_given?
@@ -285,6 +340,13 @@ module CsvMadness
       end
     end
+    # shouldn't require reindex
+    def rename_index_column( column, new_name )
+      @index_columns[ @index_columns.index( column ) ] = new_name
+      @indexes[new_name] = @indexes[column]
+      @indexes.delete(column)
+    end
     # Each spreadsheet has its own anonymous record class, and each CSV row instantiates
     # a record of this class.  This is where the getters and setters come from.
     def create_record_class
@@ -374,5 +436,11 @@ module CsvMadness
     def update_data_accessor_module
       @module.remap_accessors( columns_to_mapping )
     end
+    def column_must_exist( *cols )
+      for col in cols
+        raise ArgumentError.new( "#{caller[0]}: column :#{col} does not exist.") unless self.columns.include?(col)
+      end
+    end
   end
 end

data/lib/csv_madness.rb CHANGED Viewed

@@ -1,5 +1,5 @@
 require 'csv'
-require 'pathname'
+require 'fun_with_files'
 require 'time'        # to use Time.parse to parse cells to get the date
 require 'debugger'
@@ -7,6 +7,9 @@ require_relative 'csv_madness/data_accessor_module'
 require_relative 'csv_madness/sheet'
 require_relative 'csv_madness/record'
+FunWith::Files::RootPath.rootify( CsvMadness, __FILE__.fwf_filepath.dirname.up )
 CsvMadness.class_eval do
   def self.load( csv, opts = {} )
     CsvMadness::Sheet.from( csv, opts )

data/test/helper.rb CHANGED Viewed

@@ -19,3 +19,85 @@ require 'csv_madness'
 class Test::Unit::TestCase
 end
+class MadTestCase < Test::Unit::TestCase
+  MARY_ID = "1"
+  BILL_ID = "2"
+  DARWIN_ID = "3"
+  CHUCK_ID = "4"
+  def load_mary
+    id = @simple.index_columns.first
+    @mary = @simple.fetch( id, MARY_ID )
+  end
+  def load_bill
+    id = @simple.index_columns.first
+    @bill = @simple.fetch( id, BILL_ID )
+  end
+  def load_darwin
+    id = @simple.index_columns.first
+    @darwin = @simple.fetch( id, DARWIN_ID )
+  end
+  def load_chuck
+    id = @simple.index_columns.first
+    @chuck = @simple.fetch( id, CHUCK_ID )
+  end
+  def set_person_records
+    load_mary
+    load_darwin
+    load_bill
+    load_chuck
+  end
+  def muck_up_spreadsheet
+    @simple.add_column(:scrambled_name) do |val, record|
+      record.fname.chars.map(&:to_s).zip( record.lname.chars.map(&:to_s) ).flatten.compact.join
+    end
+    @simple.alter_column(:id) do |val|
+      (val.to_i << 8) % 27
+    end
+    @simple.set_column_type(:id, :float)
+    @simple.set_column_type(:born, :date)
+    @simple.alter_column(:born) do |val|
+      if val.is_a?(String)
+        -1.0
+      else
+        (Time.now - val).to_f
+      end
+    end
+    @simple.drop_column(:fname)
+    @simple.drop_column(:lname)
+  end
+  def set_spreadsheet_paths
+    @csv_search_path = Pathname.new( __FILE__ ).dirname.join("csv")
+    @csv_output_path = @csv_search_path.join("out")
+    CsvMadness::Sheet.add_search_path( @csv_search_path )
+    CsvMadness::Sheet.add_search_path( @csv_output_path )
+  end
+  def load_simple_spreadsheet
+    @simple = CsvMadness.load( "simple.csv", index: [:id] )
+  end
+  def unload_simple_spreadsheet
+    @simple = nil
+  end
+  def empty_output_folder
+    if defined?(FileUtils)
+      FileUtils.rm_rf( Dir.glob( @csv_output_path.join("**","*") ) )
+    else
+      puts "fileutils not defined"
+      `rm -rf #{@csv_output_path.join('*')}`
+    end
+  end
+end

data/test/test_csv_madness.rb CHANGED Viewed

@@ -1,26 +1,21 @@
 require 'helper'
-class TestCsvMadness < Test::Unit::TestCase
+class TestCsvMadness < MadTestCase
   context "all:" do
     setup do
-      @csv_search_path = Pathname.new( __FILE__ ).dirname.join("csv")
-      @csv_output_path = @csv_search_path.join("out")
-      CsvMadness::Sheet.add_search_path( @csv_search_path )
+      set_spreadsheet_paths
+      load_simple_spreadsheet
     end
     teardown do
-      if defined?(FileUtils)
-        FileUtils.rm_rf( Dir.glob( @csv_output_path.join("**","*") ) )
-      else
-        puts "fileutils not defined"
-        `rm -rf #{@csv_output_path.join('*')}`
-      end
+      empty_output_folder
     end
     context "testing sheet basics" do
       should "not accept duplicate search paths" do
+        @path_count = CsvMadness::Sheet.search_paths.length
         CsvMadness::Sheet.add_search_path( Pathname.new( __FILE__ ).dirname.join("csv") )
-        assert_equal 1, CsvMadness::Sheet.instance_variable_get("@search_paths").length
+        assert_equal @path_count, CsvMadness::Sheet.search_paths.length
       end
       should "load a simple spreadsheet" do
@@ -49,11 +44,11 @@ class TestCsvMadness < Test::Unit::TestCase
     context "testing transformations" do
       context "with a simple spreadsheet loaded" do
         setup do
-          @simple = CsvMadness.load( "simple.csv", index: [:id] )
+          load_simple_spreadsheet
         end
         teardown do
-          @simple = nil
+          unload_simple_spreadsheet
         end
         should "transform every cell" do
@@ -154,6 +149,49 @@ class TestCsvMadness < Test::Unit::TestCase
           assert_equal records.length, records.compact.length
           assert_equal 2, records.length
           assert_equal "1", records.first.id
+        end
+        should "rename columns" do
+          load_mary
+          assert_equal "Mary", @mary.fname
+          assert_equal "Moore", @mary.lname
+          assert_equal "Mary", @mary[1]
+          assert_equal "Moore", @mary[2]
+          @simple.rename_column( :fname, :first_name )
+          @simple.rename_column( :lname, :last_name )
+          assert_equal "Mary", @mary.first_name
+          assert_equal "Moore", @mary.last_name
+          assert_equal "Mary", @mary[1]
+          assert_equal "Moore", @mary[2]
+        end
+        should "rename an index column" do
+          @simple.rename_column( :id, :identifier )
+          @mary = @simple.fetch( :identifier, "1" )
+          assert_equal "1", @mary.identifier
+        end
+        should "rename an index column and ensure that the outputted spreadsheet has the new column name" do
+          @simple.rename_column( :id, :identifier )
+          @outfile = @csv_output_path.join("output.csv")
+          @simple.write_to_file( @outfile, force_quotes: true )
+          @simple = CsvMadness.load( @outfile, index: [:identifier] )
+          load_mary
+          assert_equal "Mary", @mary.fname
+        end
+        should "filter! records" do
+          @simple.filter! do |record|
+            record.id == BILL_ID || record.id == CHUCK_ID
+          end
+          assert_equal 2, @simple.records.length
         end
       end
     end
@@ -194,7 +232,7 @@ class TestCsvMadness < Test::Unit::TestCase
     context "testing add/remove column transformations" do
       context "with simple spreadsheet loaded" do
         setup do
-          load_simple
+          load_simple_spreadsheet
         end
         should "add column" do
@@ -221,12 +259,4 @@ class TestCsvMadness < Test::Unit::TestCase
       end
     end
   end
-  def load_simple
-    @simple = CsvMadness.load( "simple.csv", index: [:id] )
-  end
-  def load_mary
-    @mary = @simple.fetch( :id, "1" )
-  end
 end

data/test/test_sheet.rb ADDED Viewed

@@ -0,0 +1,24 @@
+require 'helper'
+class TestCsvMadness < MadTestCase
+  context "testing getter_name()" do
+    should "return proper function names" do
+      assert_equal :hello_world, CsvMadness::Sheet.getter_name( "  heLLo __ world " )
+      assert_equal :_0_hello_world, CsvMadness::Sheet.getter_name( "0  heLLo __ worlD!!! " )
+    end
+  end
+  context "testing default spreadsheet paths" do
+    should "only load existing paths" do
+      assert_raise(RuntimeError) do
+        CsvMadness::Sheet.add_search_path( CsvMadness.root.join("rocaganthor") )
+      end
+    end
+    should "check a search path for files to load" do
+      CsvMadness::Sheet.add_search_path( CsvMadness.root.join("test", "csv") )
+      sheet = CsvMadness.load( "with_nils.csv" )
+      assert sheet.is_a?(CsvMadness::Sheet)
+    end
+  end
+end

metadata CHANGED Viewed

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: csv_madness
 version: !ruby/object:Gem::Version
-  version: 0.0.3
+  version: 0.0.4
   prerelease:
 platform: ruby
 authors:
@@ -9,8 +9,24 @@ authors:
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2013-06-03 00:00:00.000000000 Z
+date: 2013-11-07 00:00:00.000000000 Z
 dependencies:
+- !ruby/object:Gem::Dependency
+  name: fun_with_files
+  requirement: !ruby/object:Gem::Requirement
+    none: false
+    requirements:
+    - - ! '>='
+      - !ruby/object:Gem::Version
+        version: '0'
+  type: :runtime
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    none: false
+    requirements:
+    - - ! '>='
+      - !ruby/object:Gem::Version
+        version: '0'
 - !ruby/object:Gem::Dependency
   name: shoulda
   requirement: !ruby/object:Gem::Requirement
@@ -100,6 +116,7 @@ extra_rdoc_files:
 - LICENSE.txt
 - README.rdoc
 files:
+- ./CHANGELOG.markdown
 - ./Gemfile
 - ./README.rdoc
 - ./Rakefile
@@ -111,6 +128,7 @@ files:
 - ./test/csv/simple.csv
 - ./test/helper.rb
 - ./test/test_csv_madness.rb
+- ./test/test_sheet.rb
 - LICENSE.txt
 - README.rdoc
 homepage: http://github.com/darthschmoo/csv_madness
@@ -128,7 +146,7 @@ required_ruby_version: !ruby/object:Gem::Requirement
       version: '0'
       segments:
       - 0
-      hash: 2889880782640461400
+      hash: 1185350757253474800
 required_rubygems_version: !ruby/object:Gem::Requirement
   none: false
   requirements: