tabtools 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,86 @@
1
+ require 'csv'
2
+
3
+ class Anonymizer
4
+
5
+ attr_reader :anonWords, :low, :high
6
+ attr_accessor :input, :output, :field
7
+
8
+ @minWords = 2
9
+ @maxWords = 4
10
+
11
+ @@anonymousText = <<ANONTEXT
12
+ Lorem ipsum dolor sit amet consectetur adipiscing elit Mauris urna erat volutpat a ullamcorper sit amet
13
+ convallis quis dui Ut sem erat euismod in iaculis id tincidunt aliquam magna Vivamus lobortis eu erat in feugiat
14
+ Vestibulum fermentum dictum fermentum Class aptent taciti sociosqu ad litora torquent per conubia nostra
15
+ per inceptos himenaeos Ut quis rutrum mi Mauris sit amet cursus nisi Suspendisse accumsan leo ac lobortis egestas
16
+ sapien eros mattis lorem eu posuere mi justo in nunc Sed felis ligula egestas vel nulla sed egestas lobortis justo
17
+ Donec quis interdum velit Proin felis arcu vestibulum non augue nec ultricies pulvinar velit Nunc ac libero velit
18
+ Aenean bibendum varius nisi ut molestie Nam tempus nec lacus eget malesuada Donec et accumsan dolor et ullamcorper ante
19
+ Etiam quis consectetur leo Suspendisse mattis sagittis imperdiet Phasellus facilisis eget justo ac mollis
20
+ Phasellus eleifend tortor est sit amet venenatis enim fringilla id Vestibulum rutrum tempus tortor ac volutpat
21
+ Nullam non imperdiet lorem Cras tincidunt porttitor condimentum Pellentesque tincidunt magna id aliquet interdum augue
22
+ nisl convallis enim volutpat mollis urna metus et lacus Donec tortor sapien ultrices sit amet blandit quis gravida ut
23
+ massa Mauris mauris lacus pretium sit amet risus quis blandit viverra lorem Nunc fringilla elit a elementum gravida
24
+ Duis vel sodales elit eget tempor leo Quisque in semper nisl Fusce eget risus sollicitudin molestie diam et tincidunt
25
+ sem Curabitur accumsan pretium interdum Suspendisse semper enim ac augue hendrerit vel sollicitudin diam mollis
26
+ Curabitur lacinia ante nec eros maximus a vehicula velit aliquet In ullamcorper nec ante eu dictum Proin mi enim
27
+ malesuada ut ornare sit amet maximus commodo ipsum Nullam venenatis purus non sollicitudin sollicitudin augue
28
+ augue euismod lorem ut hendrerit velit neque sed nibh Class aptent taciti sociosqu ad litora torquent per conubia
29
+ nostra per inceptos himenaeos Proin ac elementum nisl
30
+ ANONTEXT
31
+
32
+ @codedWords = {}
33
+
34
+ def initialize
35
+ @anonWords = @@anonymousText.gsub(/\n/,' ').split
36
+ @coded = {}
37
+ @low = 0
38
+ @limit = @anonWords.length-1
39
+ @rand = Random.new
40
+ @minWords = 2
41
+ @maxWords = 4
42
+ end
43
+
44
+ def anonymize(input, fields, output)
45
+ puts "Anonymizing %-25s to %-25s - %s " % [input, output, fields.inspect]
46
+ raise 'The input file must be specified' if input.nil?
47
+ raise 'The input file must exist' unless File.exist?(input)
48
+ raise 'The field(s) to anonymize must be provided as a String or an array of Strings' unless fields.instance_of?(String) || fields.instance_of?(Array)
49
+ @input = input
50
+ @output = output
51
+ @anonVals = {}
52
+ csvFields = CSV.open(@input, &:readline)
53
+ output = CSV.open(@output,'w')
54
+ output << csvFields
55
+ fields = [fields] if fields.is_a? String
56
+ CSV.foreach('input.csv', :headers => true) do |row|
57
+ puts "--"
58
+ fields.each do |field|
59
+ puts "fld: #{field}"
60
+ puts "pre: #{row.inspect}"
61
+ row[field] = anonWords(row[field]) unless row[field].nil?
62
+ puts "pst: #{row.inspect}"
63
+ end
64
+ output << row
65
+ end
66
+ end
67
+
68
+ def anonWords value
69
+ return @anonVals[value] unless @anonVals[value].nil?
70
+ range = rand(@minWords..@maxWords)
71
+ limit = @limit - range
72
+ first = rand(range..limit)
73
+ last = first + range - 1
74
+ words = @anonWords[first..last].join(' ')
75
+ @anonVals[value] = words
76
+ end
77
+
78
+ def codeValue value
79
+ if @codedWords[value].nil?
80
+ @codedWords[value] = anonWords
81
+ end
82
+ @codedWords[value]
83
+ end
84
+
85
+
86
+ end # class Anonymizer
data/lib/tabtools.rb ADDED
@@ -0,0 +1,22 @@
1
+ # Copyright (C) 2014, 2018 Chris Gerrard
2
+ #
3
+ # This program is free software: you can redistribute it and/or modify
4
+ # it under the terms of the GNU General Public License as published by
5
+ # the Free Software Foundation, either version 3 of the License, or
6
+ # (at your option) any later version.
7
+ #
8
+ # This program is distributed in the hope that it will be useful,
9
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
10
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11
+ # GNU General Public License for more details.
12
+ #
13
+ # You should have received a copy of the GNU General Public License
14
+ # along with this program. If not, see <http://www.gnu.org/licenses/>.
15
+
16
+ require_relative 'tabtools/utilities/anonymizer'
17
+
18
+ # Represents Tableau Workbooks and their contents.
19
+ #
20
+ module TabTools
21
+ VERSION = '0.0.1'
22
+ end
metadata ADDED
@@ -0,0 +1,50 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: tabtools
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.1
5
+ platform: ruby
6
+ authors:
7
+ - Chris Gerrard
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2018-02-01 00:00:00.000000000 Z
12
+ dependencies: []
13
+ description: A collection of Ruby classes designed for accessing and recording information
14
+ about, producing documentation about, and for manipulating Tableau Workbooks and
15
+ their contents.
16
+ email: Chris@Gerrard.net
17
+ executables: []
18
+ extensions: []
19
+ extra_rdoc_files: []
20
+ files:
21
+ - LICENSE.md
22
+ - LICENSE.txt
23
+ - README.md
24
+ - lib/tabtools.rb
25
+ - lib/tabtools/utilities/anonymizer.rb
26
+ homepage: http://rubygems.org/gems/tabtools
27
+ licenses:
28
+ - GPL-3.0
29
+ metadata: {}
30
+ post_install_message:
31
+ rdoc_options: []
32
+ require_paths:
33
+ - lib
34
+ required_ruby_version: !ruby/object:Gem::Requirement
35
+ requirements:
36
+ - - ">="
37
+ - !ruby/object:Gem::Version
38
+ version: '0'
39
+ required_rubygems_version: !ruby/object:Gem::Requirement
40
+ requirements:
41
+ - - ">="
42
+ - !ruby/object:Gem::Version
43
+ version: '0'
44
+ requirements: []
45
+ rubyforge_project:
46
+ rubygems_version: 2.6.13
47
+ signing_key:
48
+ specification_version: 4
49
+ summary: Classes for analyzing, documenting, and managing Tableau Workbooks.
50
+ test_files: []