RubyGems - reckon - Versions diffs - 0.9.0 → 0.9.1 - Mend

reckon 0.9.0 → 0.9.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31) hide show

checksums.yaml +4 -4
data/.github/workflows/ruby.yml +2 -0
data/.rubocop.yml +20 -0
data/CHANGELOG.md +10 -0
data/Gemfile.lock +1 -1
data/Rakefile +2 -2
data/bin/build-new-version.sh +3 -2
data/bin/reckon +1 -1
data/lib/reckon/app.rb +27 -24
data/lib/reckon/beancount_parser.rb +150 -0
data/lib/reckon/cosine_similarity.rb +0 -1
data/lib/reckon/csv_parser.rb +73 -37
data/lib/reckon/date_column.rb +18 -7
data/lib/reckon/ledger_parser.rb +23 -15
data/lib/reckon/money.rb +18 -16
data/lib/reckon/options.rb +44 -19
data/lib/reckon/version.rb +1 -1
data/lib/reckon.rb +1 -0
data/spec/cosine_training_and_test.rb +1 -1
data/spec/data_fixtures/multi-line-field.csv +5 -0
data/spec/integration/invalid_header_example/output.ledger +6 -7
data/spec/integration/invalid_header_example/test_args +1 -1
data/spec/integration/tab_delimited_file/input.csv +2 -0
data/spec/integration/tab_delimited_file/output.ledger +8 -0
data/spec/integration/tab_delimited_file/test_args +1 -0
data/spec/reckon/csv_parser_spec.rb +85 -26
data/spec/reckon/date_column_spec.rb +6 -0
data/spec/reckon/ledger_parser_spec.rb +25 -23
data/spec/reckon/options_spec.rb +2 -2
data/spec/spec_helper.rb +2 -0
metadata +8 -2

data/lib/reckon/date_column.rb CHANGED Viewed

@@ -2,13 +2,17 @@ module Reckon
   class DateColumn < Array
     attr_accessor :endian_precedence
     def initialize( arr = [], options = {} )
-      @options = options
+      # output date format
+      @ledger_date_format = options[:ledger_date_format]
+      # input date format
+      date_format = options[:date_format]
       arr.each do |value|
-        if options[:date_format]
+        if date_format
           begin
-            value = Date.strptime(value, options[:date_format])
+            value = Date.strptime(value, date_format)
           rescue
-            puts "I'm having trouble parsing '#{value}' with the desired format: #{options[:date_format]}"
+            puts "I'm having trouble parsing '#{value}' with the desired format: #{date_format}"
             exit 1
           end
         else
@@ -34,7 +38,7 @@ module Reckon
         self.push( value )
       end
       # if endian_precedence still nil, raise error
-      unless @endian_precedence || options[:date_format]
+      unless @endian_precedence || date_format
         raise( "Unable to determine date format. Please specify using --date-format" )
       end
     end
@@ -54,7 +58,7 @@ module Reckon
       date = self.for(index)
       return "" if date.nil?
-      date.strftime(@options[:ledger_date_format] || '%Y-%m-%d')
+      date.strftime(@ledger_date_format || '%Y-%m-%d')
     end
     def self.likelihood(entry)
@@ -65,7 +69,14 @@ module Reckon
       date_score -= entry.gsub(/[\-\/\.\d:\[\]]/, '').length
       date_score += 30 if entry =~ /^\d+[:\/\.-]\d+[:\/\.-]\d+([ :]\d+[:\/\.]\d+)?$/
       date_score += 10 if entry =~ /^\d+\[\d+:GMT\]$/i
-      return date_score
+      begin
+        DateTime.parse(entry)
+        date_score += 20
+      rescue Date::Error, ArgumentError
+      end
+      date_score
     end
   end
 end

data/lib/reckon/ledger_parser.rb CHANGED Viewed

@@ -1,4 +1,3 @@
-#!/usr/bin/env ruby
 # frozen_string_literal: true
 # From: https://www.ledger-cli.org/3.0/doc/ledger3.html#Transactions-and-Comments
@@ -110,20 +109,20 @@ require 'rubygems'
 module Reckon
   class LedgerParser
-    attr_accessor :entries
-    def initialize(ledger, options = {})
+    # ledger is an object that responds to #each_line,
+    # (e.g. a StringIO or an IO object)
+    def initialize(options = {})
       @options = options
       @date_format = options[:ledger_date_format] || options[:date_format] || '%Y-%m-%d'
-      parse(ledger)
     end
     def parse(ledger)
-      @entries = []
+      entries = []
       new_entry = {}
       in_comment = false
       comment_chars = ';#%*|'
-      ledger.strip.split("\n").each do |entry|
+      ledger.each_line do |entry|
+        entry.rstrip!
         # strip comment lines
         in_comment = true if entry == 'comment'
         in_comment = false if entry == 'end comment'
@@ -132,7 +131,7 @@ module Reckon
         # (date, type, code, description), type and code are optional
         if (m = entry.match(%r{^(\d+[\d/-]+)\s+([*!])?\s*(\([^)]+\))?\s*(.*)$}))
-          add_entry(new_entry)
+          add_entry(entries, new_entry)
           new_entry = {
             date: try_parse_date(m[1]),
             type: m[2] || "",
@@ -141,23 +140,24 @@ module Reckon
             accounts: []
           }
         elsif entry =~ /^\s*$/ && new_entry[:date]
-          add_entry(new_entry)
+          add_entry(entries,new_entry)
           new_entry = {}
         elsif new_entry[:date] && entry =~ /^\s+/
           LOGGER.info("Adding new account #{entry}")
           new_entry[:accounts] << parse_account_line(entry)
         else
           LOGGER.info("Unknown entry type: #{entry}")
-          add_entry(new_entry)
+          add_entry(entries, new_entry)
           new_entry = {}
         end
       end
-      add_entry(new_entry)
+      add_entry(entries, new_entry)
+      entries
     end
     # roughly matches ledger csv format
-    def to_csv
-      return @entries.flat_map do |n|
+    def to_csv(ledger)
+      return parse(ledger).flat_map do |n|
         n[:accounts].map do |a|
           row = [
             n[:date].strftime(@date_format),
@@ -174,13 +174,21 @@ module Reckon
       end
     end
+    def format_row(row, line1, line2)
+      out = "#{row[:pretty_date]}\t#{row[:description]}#{row[:note] ? "\t; " + row[:note]: ""}\n"
+      out += "\t#{line1.first}\t\t\t#{line1.last}\n"
+      out += "\t#{line2.first}\t\t\t#{line2.last}\n\n"
+      out
+    end
     private
-    def add_entry(entry)
+    def add_entry(entries, entry)
       return unless entry[:date] && entry[:accounts].length > 1
       entry[:accounts] = balance(entry[:accounts])
-      @entries << entry
+      entries << entry
     end
     def try_parse_date(date_str)

data/lib/reckon/money.rb CHANGED Viewed

@@ -6,11 +6,10 @@ module Reckon
     include Comparable
     attr_accessor :amount, :currency, :suffixed
     def initialize(amount, options = {})
-      @options = options
       @amount_raw = amount
       @raw = options[:raw]
-      @amount = parse(amount, options)
+      @amount = parse(amount, options[:comma_separates_cents])
       @amount = -@amount if options[:inverse]
       @currency = options[:currency] || "$"
       @suffixed = options[:suffixed]
@@ -21,7 +20,7 @@ module Reckon
     end
     def to_s
-      return @options[:raw] ? "#{@amount_raw} | #{@amount}" : @amount
+      return @raw ? "#{@amount_raw} | #{@amount}" : @amount
     end
     # unary minus
@@ -60,34 +59,37 @@ module Reckon
       return (@amount >= 0 ? " " : "") + amt
     end
+    def self.likelihood(entry)
+      money_score = 0
+      # digits separated by , or . with no more than 2 trailing digits
+      money_score += 40 if entry.match(/\d+[,.]\d{2}[^\d]*$/)
+      money_score += 10 if entry[/^\$?\-?\$?\d+[\.,\d]*?[\.,]\d\d$/]
+      money_score += 10 if entry[/\d+[\.,\d]*?[\.,]\d\d$/]
+      money_score += entry.gsub(/[^\d\.\-\+,\(\)]/, '').length if entry.length < 7
+      money_score -= entry.length if entry.length > 12
+      money_score -= 20 if (entry !~ /^[\$\+\.\-,\d\(\)]+$/) && entry.length > 0
+      money_score
+    end
+    private
     def pretty_amount(amount)
       sprintf("%0.2f", amount).reverse.gsub(/(\d{3})(?=\d)/, '\\1,').reverse
     end
-    def parse(value, options = {})
+    def parse(value, comma_separates_cents)
       value = value.to_s
       # Empty string is treated as money with value 0
       return value.to_f if value.to_s.empty?
       invert = value.match(/^\(.*\)$/)
       value = value.gsub(/[^0-9,.-]/, '')
-      value = value.tr('.', '').tr(',', '.') if options[:comma_separates_cents]
+      value = value.tr('.', '').tr(',', '.') if comma_separates_cents
       value = value.tr(',', '')
       value = value.to_f
       return invert ? -value : value
     end
-    def Money::likelihood(entry)
-      money_score = 0
-      # digits separated by , or . with no more than 2 trailing digits
-      money_score += 40 if entry.match(/\d+[,.]\d{2}[^\d]*$/)
-      money_score += 10 if entry[/^\$?\-?\$?\d+[\.,\d]*?[\.,]\d\d$/]
-      money_score += 10 if entry[/\d+[\.,\d]*?[\.,]\d\d$/]
-      money_score += entry.gsub(/[^\d\.\-\+,\(\)]/, '').length if entry.length < 7
-      money_score -= entry.length if entry.length > 12
-      money_score -= 20 if (entry !~ /^[\$\+\.\-,\d\(\)]+$/) && entry.length > 0
-      money_score
-    end
   end
   class MoneyColumn < Array

data/lib/reckon/options.rb CHANGED Viewed

@@ -1,8 +1,10 @@
+# frozen_string_literal: true
 module Reckon
+  # Singleton class for parsing command line flags
   class Options
-    @@cli = HighLine.new
-    def self.parse(args = ARGV, stdin = $stdin)
+    def self.parse_command_line_options(args = ARGV, stdin = $stdin)
+      cli = HighLine.new
       options = { output_file: $stdout }
       OptionParser.new do |opts|
         opts.banner = "Usage: Reckon.rb [options]"
@@ -32,19 +34,23 @@ module Reckon
           options[:output_file] = File.open(o, 'a')
         end
-        opts.on("-l", "--learn-from FILE", "An existing ledger file to learn accounts from") do |l|
+        opts.on("-l", "--learn-from FILE",
+                "An existing ledger file to learn accounts from") do |l|
           options[:existing_ledger_file] = l
         end
-        opts.on("", "--ignore-columns 1,2,5", "Columns to ignore, starts from 1") do |ignore|
+        opts.on("", "--ignore-columns 1,2,5",
+                "Columns to ignore, starts from 1") do |ignore|
           options[:ignore_columns] = ignore.split(",").map(&:to_i)
         end
-        opts.on("", "--money-column 2", Integer, "Column number of the money column, starts from 1") do |col|
+        opts.on("", "--money-column 2", Integer,
+                "Column number of the money column, starts from 1") do |col|
           options[:money_column] = col
         end
-        opts.on("", "--money-columns 2,3", "Column number of the money columns, starts from 1 (1 or 2 columns)") do |ignore|
+        opts.on("", "--money-columns 2,3",
+                "Column number of the money columns, starts from 1 (1 or 2 columns)") do |ignore|
           options[:money_columns] = ignore.split(",").map(&:to_i)
         end
@@ -52,20 +58,28 @@ module Reckon
           options[:raw] = n
         end
-        opts.on("", "--date-column 3", Integer, "Column number of the date column, starts from 1") do |col|
+        opts.on("", "--date-column 3", Integer,
+                "Column number of the date column, starts from 1") do |col|
           options[:date_column] = col
         end
-        opts.on("", "--contains-header [N]", Integer, "Skip N header rows - default 1") do |hdr|
+        opts.on("", "--contains-header [N]", Integer,
+                "Skip N header rows - default 1") do |hdr|
           options[:contains_header] = 1
           options[:contains_header] = hdr.to_i
         end
+        opts.on("", "--contains-footer [N]", Integer,
+                "Skip N footer rows - default 0") do |hdr|
+          options[:contains_footer] = hdr.to_i || 0
+        end
         opts.on("", "--csv-separator ','", "CSV separator (default ',')") do |sep|
           options[:csv_separator] = sep
         end
-        opts.on("", "--comma-separates-cents", "Use comma to separate cents ($100,50 vs. $100.50)") do |c|
+        opts.on("", "--comma-separates-cents",
+                "Use comma to separate cents ($100,50 vs. $100.50)") do |c|
           options[:comma_separates_cents] = c
         end
@@ -73,23 +87,28 @@ module Reckon
           options[:encoding] = e
         end
-        opts.on("-c", "--currency '$'", "Currency symbol to use - default $ (ex £, EUR)") do |e|
-          options[:currency] = e
+        opts.on("-c", "--currency '$'",
+                "Currency symbol to use - default $ (ex £, EUR)") do |e|
+          options[:currency] = e || '$'
         end
-        opts.on("", "--date-format FORMAT", "CSV file date format (see `date` for format)") do |d|
+        opts.on("", "--date-format FORMAT",
+                "CSV file date format (see `date` for format)") do |d|
           options[:date_format] = d
         end
-        opts.on("", "--ledger-date-format FORMAT", "Ledger date format (see `date` for format)") do |d|
+        opts.on("", "--ledger-date-format FORMAT",
+                "Ledger date format (see `date` for format)") do |d|
           options[:ledger_date_format] = d
         end
-        opts.on("-u", "--unattended", "Don't ask questions and guess all the accounts automatically. Use with --learn-from or --account-tokens options.") do |n|
+        opts.on("-u", "--unattended",
+                "Don't ask questions and guess all the accounts automatically. Use with --learn-from or --account-tokens options.") do |n|
           options[:unattended] = n
         end
-        opts.on("-t", "--account-tokens FILE", "YAML file with manually-assigned tokens for each account (see README)") do |a|
+        opts.on("-t", "--account-tokens FILE",
+                "YAML file with manually-assigned tokens for each account (see README)") do |a|
           options[:account_tokens_file] = a
         end
@@ -107,7 +126,8 @@ module Reckon
           options[:default_outof_account] = a
         end
-        opts.on("", "--fail-on-unknown-account", "Fail on unmatched transactions.") do |n|
+        opts.on("", "--fail-on-unknown-account",
+                "Fail on unmatched transactions.") do |n|
           options[:fail_on_unknown_account] = n
         end
@@ -115,6 +135,11 @@ module Reckon
           options[:suffixed] = e
         end
+        opts.on("", "--ledger-format FORMAT",
+                "Output/Learn format: BEANCOUNT or LEDGER. Default: LEDGER") do |n|
+          options[:format] = n
+        end
         opts.on_tail("-h", "--help", "Show this message") do
           puts opts
           exit
@@ -137,7 +162,7 @@ module Reckon
       end
       unless options[:file]
-        options[:file] = @@cli.ask("What CSV file should I parse? ")
+        options[:file] = cli.ask("What CSV file should I parse? ")
         unless options[:file].empty?
           puts "\nYou must provide a CSV file to parse.\n"
           puts parser
@@ -148,7 +173,7 @@ module Reckon
       unless options[:bank_account]
         raise "Must specify --account in unattended mode" if options[:unattended]
-        options[:bank_account] = @@cli.ask("What is this account named in Ledger?\n") do |q|
+        options[:bank_account] = cli.ask("What is this account named in Ledger?\n") do |q|
           q.readline = true
           q.validate = /^.{2,}$/
           q.default = "Assets:Bank:Checking"

data/lib/reckon/version.rb CHANGED Viewed

@@ -1,3 +1,3 @@
 module Reckon
-  VERSION="0.9.0"
+  VERSION = "0.9.1"
 end

data/lib/reckon.rb CHANGED Viewed

@@ -15,6 +15,7 @@ require_relative 'reckon/cosine_similarity'
 require_relative 'reckon/date_column'
 require_relative 'reckon/money'
 require_relative 'reckon/ledger_parser'
+require_relative 'reckon/beancount_parser'
 require_relative 'reckon/csv_parser'
 require_relative 'reckon/options'
 require_relative 'reckon/app'

data/spec/cosine_training_and_test.rb CHANGED Viewed

@@ -8,7 +8,7 @@ ledger_file = ARGV[0]
 account = ARGV[1]
 seed = ARGV[2] ? ARGV[2].to_i : Random.new_seed
-ledger = Reckon::LedgerParser.new(File.read(ledger_file))
+ledger = Reckon::LedgerParser.new(File.new(ledger_file))
 matcher = Reckon::CosineSimilarity.new({})
 train = []

data/spec/data_fixtures/multi-line-field.csv ADDED Viewed

@@ -0,0 +1,5 @@
+,311053760,2002-09-10T23:00:04,Merchant Transaction,Complete,,,"Lyft, Inc",- $21.59,,,,,,Venmo balance,,,,,Venmo,,
+,,,,,,,,,,,,,,,,,$23.40,$0.00,,$0.00,"In case of errors or questions about your
+        electronic transfers:
+        This is a multi-line string
+        "

data/spec/integration/invalid_header_example/output.ledger CHANGED Viewed

@@ -1,8 +1,7 @@
-4016-02-18
-	Assets:Bank:Checking			 $10.00
-	Income:Unknown
-4016-02-19
-	Income:Unknown
-	Assets:Bank:Checking			 $0.00
+2016-02-18	COTISATION JAZZ; COTISATION JAZZ; EUR
+	Expenses:Unknown
+	Assets:Bank:Checking			-$8.10
+2016-02-19	VIR RECU 508160; VIR RECU 1234567834S DE: Francois REF: 123457891234567894561231 PROVENANCE: DE Allemagne; EUR
+	Assets:Bank:Checking			 $50.00
+	Expenses:Unknown

data/spec/integration/invalid_header_example/test_args CHANGED Viewed

	@@ -1 +1 @@
1	- -f input.csv --unattended --account Assets:Bank:Checking --contains-header 4
1	+ -f input.csv --unattended --account Assets:Bank:Checking --contains-header 4 --comma-separates-cents --verbose

data/spec/integration/tab_delimited_file/input.csv ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ 123456789 EUR 20160102 15,00 10,00 20160102 -5,00 DESCRIPTION
2	+ 123456789 EUR 20160102 10,00 0,00 20160102 -10,00 DESCRIPTION

data/spec/integration/tab_delimited_file/output.ledger ADDED Viewed

@@ -0,0 +1,8 @@
+2016-01-02	123456789; EUR; 20160102; DESCRIPTION
+	Expenses:Unknown
+	Test::Account			-€5.00
+2016-01-02	123456789; EUR; 20160102; DESCRIPTION
+	Expenses:Unknown
+	Test::Account			-€10.00

data/spec/integration/tab_delimited_file/test_args ADDED Viewed

	@@ -0,0 +1 @@
1	+ -f input.csv --unattended -c € --ignore-columns 4,5 --comma-separates-cents -v --date-format '%Y%m%d' --csv-separator '\t' -a Test::Account

data/spec/reckon/csv_parser_spec.rb CHANGED Viewed

@@ -1,5 +1,4 @@
 #!/usr/bin/env ruby
-# coding: utf-8
 require_relative "../spec_helper"
 require 'rubygems'
@@ -8,24 +7,53 @@ require_relative '../../lib/reckon'
 describe Reckon::CSVParser do
   let(:chase) { Reckon::CSVParser.new(file: fixture_path('chase.csv')) }
   let(:some_other_bank) { Reckon::CSVParser.new(file: fixture_path('some_other.csv')) }
-  let(:two_money_columns) { Reckon::CSVParser.new(file: fixture_path('two_money_columns.csv')) }
+  let(:two_money_columns) {
+    Reckon::CSVParser.new(file: fixture_path('two_money_columns.csv'))
+  }
   let(:suntrust_csv) { Reckon::CSVParser.new(file: fixture_path('suntrust.csv')) }
   let(:simple_csv) { Reckon::CSVParser.new(file: fixture_path('simple.csv')) }
-  let(:nationwide) { Reckon::CSVParser.new(file: fixture_path('nationwide.csv'), csv_separator: ',', suffixed: true, currency: "POUND") }
-  let(:german_date) { Reckon::CSVParser.new(file: fixture_path('german_date_example.csv')) }
-  let(:danish_kroner_nordea) { Reckon::CSVParser.new(file: fixture_path('danish_kroner_nordea_example.csv'), csv_separator: ';', comma_separates_cents: true) }
-  let(:yyyymmdd_date) { Reckon::CSVParser.new(file: fixture_path('yyyymmdd_date_example.csv')) }
-  let(:spanish_date) { Reckon::CSVParser.new(file: fixture_path('spanish_date_example.csv'), date_format: '%d/%m/%Y') }
-  let(:english_date) { Reckon::CSVParser.new(file: fixture_path('english_date_example.csv')) }
-  let(:ing_csv) { Reckon::CSVParser.new(file: fixture_path('ing.csv'), comma_separates_cents: true ) }
-  let(:austrian_csv) { Reckon::CSVParser.new(file: fixture_path('austrian_example.csv'), comma_separates_cents: true, csv_separator: ';' ) }
-  let(:french_csv) { Reckon::CSVParser.new(file: fixture_path('french_example.csv'), csv_separator: ';', comma_separates_cents: true) }
-  let(:broker_canada) { Reckon::CSVParser.new(file: fixture_path('broker_canada_example.csv')) }
-  let(:intuit_mint) { Reckon::CSVParser.new(file: fixture_path('intuit_mint_example.csv')) }
+  let(:nationwide) {
+    Reckon::CSVParser.new(file: fixture_path('nationwide.csv'), csv_separator: ',',
+                          suffixed: true, currency: "POUND")
+  }
+  let(:german_date) {
+    Reckon::CSVParser.new(file: fixture_path('german_date_example.csv'))
+  }
+  let(:danish_kroner_nordea) {
+    Reckon::CSVParser.new(file: fixture_path('danish_kroner_nordea_example.csv'),
+                          csv_separator: ';', comma_separates_cents: true)
+  }
+  let(:yyyymmdd_date) {
+    Reckon::CSVParser.new(file: fixture_path('yyyymmdd_date_example.csv'))
+  }
+  let(:spanish_date) {
+    Reckon::CSVParser.new(file: fixture_path('spanish_date_example.csv'),
+                          date_format: '%d/%m/%Y')
+  }
+  let(:english_date) {
+    Reckon::CSVParser.new(file: fixture_path('english_date_example.csv'))
+  }
+  let(:ing_csv) {
+    Reckon::CSVParser.new(file: fixture_path('ing.csv'), comma_separates_cents: true)
+  }
+  let(:austrian_csv) {
+    Reckon::CSVParser.new(file: fixture_path('austrian_example.csv'),
+                          comma_separates_cents: true, csv_separator: ';')
+  }
+  let(:french_csv) {
+    Reckon::CSVParser.new(file: fixture_path('french_example.csv'), csv_separator: ';',
+                          comma_separates_cents: true)
+  }
+  let(:broker_canada) {
+    Reckon::CSVParser.new(file: fixture_path('broker_canada_example.csv'))
+  }
+  let(:intuit_mint) {
+    Reckon::CSVParser.new(file: fixture_path('intuit_mint_example.csv'))
+  }
   describe "parse" do
     it "should use binary encoding if none specified and chardet fails" do
-      allow(CharDet).to receive(:detect).and_return({'encoding' => nil})
+      allow(CharDet).to receive(:detect).and_return({ 'encoding' => nil })
       app = Reckon::CSVParser.new(file: fixture_path("extratofake.csv"))
       expect(app.send(:try_encoding, "foobarbaz")).to eq("BINARY")
     end
@@ -37,12 +65,16 @@ describe Reckon::CSVParser do
     end
     it "should work with other separators" do
-      Reckon::CSVParser.new(:string => "one;two\nthree;four", :csv_separator => ';').columns.should == [['one', 'three'], ['two', 'four']]
+      Reckon::CSVParser.new(:string => "one;two\nthree;four",
+                            :csv_separator => ';').columns.should == [
+                              ['one', 'three'], ['two', 'four']
+                            ]
     end
     it 'should parse quoted lines' do
       file = %q("30.03.2015";"29.03.2015";"09.04.2015";"BARAUSZAHLUNGSENTGELT";"5266 xxxx xxxx 9454";"";"0";"EUR";"0,00";"EUR";"-3,50";"0")
-      Reckon::CSVParser.new(string: file, csv_separator: ';', comma_separates_cents: true).columns.length.should == 12
+      Reckon::CSVParser.new(string: file, csv_separator: ';',
+                            comma_separates_cents: true).columns.length.should == 12
     end
     it 'should parse csv with BOM' do
@@ -50,11 +82,26 @@ describe Reckon::CSVParser do
       Reckon::CSVParser.new(file: file).columns.length.should == 41
     end
+    it 'should parse multi-line csv fields' do
+      file = File.expand_path(fixture_path("multi-line-field.csv"))
+      p = Reckon::CSVParser.new(file: file)
+      expect(p.columns[0].length).to eq 2
+      expected_field = "In case of errors or questions about your\n" +
+                       "        electronic transfers:\n" +
+                       "        This is a multi-line string\n" +
+                       "        "
+      expect(p.columns[-1][-1]).to eq expected_field
+    end
     describe 'file with invalid csv in header' do
       let(:invalid_file) { fixture_path('invalid_header_example.csv') }
       it 'should ignore invalid header lines' do
-        Reckon::CSVParser.new(file: invalid_file, contains_header: 4)
+        parser = Reckon::CSVParser.new(file: invalid_file, contains_header: 4)
+        expect(parser.csv_data).to eq([
+                                        ["19/02/2016", "VIR RECU 508160",
+                                         "VIR RECU 1234567834S DE: Francois REF: 123457891234567894561231 PROVENANCE: DE Allemagne ", "50,00", "EUR"], ["18/02/2016", "COTISATION JAZZ", "COTISATION JAZZ ", "-8,10", "EUR"]
+                                      ])
       end
       it 'should fail' do
@@ -67,19 +114,24 @@ describe Reckon::CSVParser do
   describe "columns" do
     it "should return the csv transposed" do
-      simple_csv.columns.should == [["entry1", "entry4"], ["entry2", "entry5"], ["entry3", "entry6"]]
+      simple_csv.columns.should == [["entry1", "entry4"], ["entry2", "entry5"],
+                                    ["entry3", "entry6"]]
       chase.columns.length.should == 4
     end
     it "should be ok with empty lines" do
       lambda {
-        Reckon::CSVParser.new(:string => "one,two\nthree,four\n\n\n\n\n").columns.should == [['one', 'three'], ['two', 'four']]
+        Reckon::CSVParser.new(:string => "one,two\nthree,four\n\n\n\n\n").columns.should == [
+          ['one', 'three'], ['two', 'four']
+        ]
       }.should_not raise_error
     end
   end
   describe "detect_columns" do
-    let(:harder_date_example_csv) { Reckon::CSVParser.new(file: fixture_path('harder_date_example.csv')) }
+    let(:harder_date_example_csv) {
+      Reckon::CSVParser.new(file: fixture_path('harder_date_example.csv'))
+    }
     it "should detect the money column" do
       chase.money_column_indices.should == [3]
@@ -165,13 +217,17 @@ describe Reckon::CSVParser do
     end
     it "should handle the comma_separates_cents option correctly" do
-      european_csv = Reckon::CSVParser.new(:string => "$2,00;something\n1.025,67;something else", :csv_separator => ';', :comma_separates_cents => true)
+      european_csv = Reckon::CSVParser.new(
+        :string => "$2,00;something\n1.025,67;something else", :csv_separator => ';', :comma_separates_cents => true
+      )
       european_csv.money_for(0).should == 2.00
       european_csv.money_for(1).should == 1025.67
     end
     it "should return negated values if the inverse option is passed" do
-      inversed_csv = Reckon::CSVParser.new(file: fixture_path('inversed_credit_card.csv'), inverse: true)
+      inversed_csv = Reckon::CSVParser.new(
+        file: fixture_path('inversed_credit_card.csv'), inverse: true
+      )
       inversed_csv.money_for(0).should == -30.00
       inversed_csv.money_for(3).should == 500.00
     end
@@ -229,7 +285,8 @@ describe Reckon::CSVParser do
     end
     it "should not append empty description column" do
-      parser = Reckon::CSVParser.new(:string => '01/09/2015,05354 SUBWAY,8.19,,',:date_format => '%d/%m/%Y')
+      parser = Reckon::CSVParser.new(:string => '01/09/2015,05354 SUBWAY,8.19,,',
+                                     :date_format => '%d/%m/%Y')
       parser.description_for(0).should == '05354 SUBWAY'
     end
@@ -249,7 +306,8 @@ describe Reckon::CSVParser do
     end
     it "work with other currencies such as €" do
-      euro_bank = Reckon::CSVParser.new(file: fixture_path('some_other.csv'), currency: "€", suffixed: false )
+      euro_bank = Reckon::CSVParser.new(file: fixture_path('some_other.csv'),
+                                        currency: "€", suffixed: false)
       euro_bank.pretty_money_for(1).should == "-€20.00"
       euro_bank.pretty_money_for(4).should == " €1,558.52"
       euro_bank.pretty_money_for(7).should == "-€116.22"
@@ -258,7 +316,8 @@ describe Reckon::CSVParser do
     end
     it "work with suffixed currencies such as SEK" do
-      swedish_bank = Reckon::CSVParser.new(file: fixture_path('some_other.csv'), currency: 'SEK', suffixed: true )
+      swedish_bank = Reckon::CSVParser.new(file: fixture_path('some_other.csv'),
+                                           currency: 'SEK', suffixed: true)
       swedish_bank.pretty_money_for(1).should == "-20.00 SEK"
       swedish_bank.pretty_money_for(4).should == " 1,558.52 SEK"
       swedish_bank.pretty_money_for(7).should == "-116.22 SEK"
@@ -274,7 +333,7 @@ describe Reckon::CSVParser do
   describe '85 regression test' do
     it 'should detect correct date column' do
-      p = Reckon::CSVParser.new(file:fixture_path('85-date-example.csv'))
+      p = Reckon::CSVParser.new(file: fixture_path('85-date-example.csv'))
       expect(p.date_column_index).to eq(2)
     end
   end

data/spec/reckon/date_column_spec.rb CHANGED Viewed

@@ -50,4 +50,10 @@ describe Reckon::DateColumn do
         .to eq('2013-12-13')
     end
   end
+  describe "#likelihood" do
+    it "should prefer numbers that looks like dates" do
+      expect(Reckon::DateColumn.likelihood("123456789")).to be < Reckon::DateColumn.likelihood("20160102")
+    end
+  end
 end