tabtools 0.0.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/LICENSE.md +619 -0
- data/LICENSE.txt +619 -0
- data/README.md +39 -0
- data/lib/tabtools/utilities/anonymizer.rb +86 -0
- data/lib/tabtools.rb +22 -0
- metadata +50 -0
@@ -0,0 +1,86 @@
|
|
1
|
+
require 'csv'
|
2
|
+
|
3
|
+
class Anonymizer
|
4
|
+
|
5
|
+
attr_reader :anonWords, :low, :high
|
6
|
+
attr_accessor :input, :output, :field
|
7
|
+
|
8
|
+
@minWords = 2
|
9
|
+
@maxWords = 4
|
10
|
+
|
11
|
+
@@anonymousText = <<ANONTEXT
|
12
|
+
Lorem ipsum dolor sit amet consectetur adipiscing elit Mauris urna erat volutpat a ullamcorper sit amet
|
13
|
+
convallis quis dui Ut sem erat euismod in iaculis id tincidunt aliquam magna Vivamus lobortis eu erat in feugiat
|
14
|
+
Vestibulum fermentum dictum fermentum Class aptent taciti sociosqu ad litora torquent per conubia nostra
|
15
|
+
per inceptos himenaeos Ut quis rutrum mi Mauris sit amet cursus nisi Suspendisse accumsan leo ac lobortis egestas
|
16
|
+
sapien eros mattis lorem eu posuere mi justo in nunc Sed felis ligula egestas vel nulla sed egestas lobortis justo
|
17
|
+
Donec quis interdum velit Proin felis arcu vestibulum non augue nec ultricies pulvinar velit Nunc ac libero velit
|
18
|
+
Aenean bibendum varius nisi ut molestie Nam tempus nec lacus eget malesuada Donec et accumsan dolor et ullamcorper ante
|
19
|
+
Etiam quis consectetur leo Suspendisse mattis sagittis imperdiet Phasellus facilisis eget justo ac mollis
|
20
|
+
Phasellus eleifend tortor est sit amet venenatis enim fringilla id Vestibulum rutrum tempus tortor ac volutpat
|
21
|
+
Nullam non imperdiet lorem Cras tincidunt porttitor condimentum Pellentesque tincidunt magna id aliquet interdum augue
|
22
|
+
nisl convallis enim volutpat mollis urna metus et lacus Donec tortor sapien ultrices sit amet blandit quis gravida ut
|
23
|
+
massa Mauris mauris lacus pretium sit amet risus quis blandit viverra lorem Nunc fringilla elit a elementum gravida
|
24
|
+
Duis vel sodales elit eget tempor leo Quisque in semper nisl Fusce eget risus sollicitudin molestie diam et tincidunt
|
25
|
+
sem Curabitur accumsan pretium interdum Suspendisse semper enim ac augue hendrerit vel sollicitudin diam mollis
|
26
|
+
Curabitur lacinia ante nec eros maximus a vehicula velit aliquet In ullamcorper nec ante eu dictum Proin mi enim
|
27
|
+
malesuada ut ornare sit amet maximus commodo ipsum Nullam venenatis purus non sollicitudin sollicitudin augue
|
28
|
+
augue euismod lorem ut hendrerit velit neque sed nibh Class aptent taciti sociosqu ad litora torquent per conubia
|
29
|
+
nostra per inceptos himenaeos Proin ac elementum nisl
|
30
|
+
ANONTEXT
|
31
|
+
|
32
|
+
@codedWords = {}
|
33
|
+
|
34
|
+
def initialize
|
35
|
+
@anonWords = @@anonymousText.gsub(/\n/,' ').split
|
36
|
+
@coded = {}
|
37
|
+
@low = 0
|
38
|
+
@limit = @anonWords.length-1
|
39
|
+
@rand = Random.new
|
40
|
+
@minWords = 2
|
41
|
+
@maxWords = 4
|
42
|
+
end
|
43
|
+
|
44
|
+
def anonymize(input, fields, output)
|
45
|
+
puts "Anonymizing %-25s to %-25s - %s " % [input, output, fields.inspect]
|
46
|
+
raise 'The input file must be specified' if input.nil?
|
47
|
+
raise 'The input file must exist' unless File.exist?(input)
|
48
|
+
raise 'The field(s) to anonymize must be provided as a String or an array of Strings' unless fields.instance_of?(String) || fields.instance_of?(Array)
|
49
|
+
@input = input
|
50
|
+
@output = output
|
51
|
+
@anonVals = {}
|
52
|
+
csvFields = CSV.open(@input, &:readline)
|
53
|
+
output = CSV.open(@output,'w')
|
54
|
+
output << csvFields
|
55
|
+
fields = [fields] if fields.is_a? String
|
56
|
+
CSV.foreach('input.csv', :headers => true) do |row|
|
57
|
+
puts "--"
|
58
|
+
fields.each do |field|
|
59
|
+
puts "fld: #{field}"
|
60
|
+
puts "pre: #{row.inspect}"
|
61
|
+
row[field] = anonWords(row[field]) unless row[field].nil?
|
62
|
+
puts "pst: #{row.inspect}"
|
63
|
+
end
|
64
|
+
output << row
|
65
|
+
end
|
66
|
+
end
|
67
|
+
|
68
|
+
def anonWords value
|
69
|
+
return @anonVals[value] unless @anonVals[value].nil?
|
70
|
+
range = rand(@minWords..@maxWords)
|
71
|
+
limit = @limit - range
|
72
|
+
first = rand(range..limit)
|
73
|
+
last = first + range - 1
|
74
|
+
words = @anonWords[first..last].join(' ')
|
75
|
+
@anonVals[value] = words
|
76
|
+
end
|
77
|
+
|
78
|
+
def codeValue value
|
79
|
+
if @codedWords[value].nil?
|
80
|
+
@codedWords[value] = anonWords
|
81
|
+
end
|
82
|
+
@codedWords[value]
|
83
|
+
end
|
84
|
+
|
85
|
+
|
86
|
+
end # class Anonymizer
|
data/lib/tabtools.rb
ADDED
@@ -0,0 +1,22 @@
|
|
1
|
+
# Copyright (C) 2014, 2018 Chris Gerrard
|
2
|
+
#
|
3
|
+
# This program is free software: you can redistribute it and/or modify
|
4
|
+
# it under the terms of the GNU General Public License as published by
|
5
|
+
# the Free Software Foundation, either version 3 of the License, or
|
6
|
+
# (at your option) any later version.
|
7
|
+
#
|
8
|
+
# This program is distributed in the hope that it will be useful,
|
9
|
+
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
10
|
+
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
11
|
+
# GNU General Public License for more details.
|
12
|
+
#
|
13
|
+
# You should have received a copy of the GNU General Public License
|
14
|
+
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
15
|
+
|
16
|
+
require_relative 'tabtools/utilities/anonymizer'
|
17
|
+
|
18
|
+
# Represents Tableau Workbooks and their contents.
|
19
|
+
#
|
20
|
+
module TabTools
|
21
|
+
VERSION = '0.0.1'
|
22
|
+
end
|
metadata
ADDED
@@ -0,0 +1,50 @@
|
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
|
+
name: tabtools
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: 0.0.1
|
5
|
+
platform: ruby
|
6
|
+
authors:
|
7
|
+
- Chris Gerrard
|
8
|
+
autorequire:
|
9
|
+
bindir: bin
|
10
|
+
cert_chain: []
|
11
|
+
date: 2018-02-01 00:00:00.000000000 Z
|
12
|
+
dependencies: []
|
13
|
+
description: A collection of Ruby classes designed for accessing and recording information
|
14
|
+
about, producing documentation about, and for manipulating Tableau Workbooks and
|
15
|
+
their contents.
|
16
|
+
email: Chris@Gerrard.net
|
17
|
+
executables: []
|
18
|
+
extensions: []
|
19
|
+
extra_rdoc_files: []
|
20
|
+
files:
|
21
|
+
- LICENSE.md
|
22
|
+
- LICENSE.txt
|
23
|
+
- README.md
|
24
|
+
- lib/tabtools.rb
|
25
|
+
- lib/tabtools/utilities/anonymizer.rb
|
26
|
+
homepage: http://rubygems.org/gems/tabtools
|
27
|
+
licenses:
|
28
|
+
- GPL-3.0
|
29
|
+
metadata: {}
|
30
|
+
post_install_message:
|
31
|
+
rdoc_options: []
|
32
|
+
require_paths:
|
33
|
+
- lib
|
34
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
35
|
+
requirements:
|
36
|
+
- - ">="
|
37
|
+
- !ruby/object:Gem::Version
|
38
|
+
version: '0'
|
39
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
40
|
+
requirements:
|
41
|
+
- - ">="
|
42
|
+
- !ruby/object:Gem::Version
|
43
|
+
version: '0'
|
44
|
+
requirements: []
|
45
|
+
rubyforge_project:
|
46
|
+
rubygems_version: 2.6.13
|
47
|
+
signing_key:
|
48
|
+
specification_version: 4
|
49
|
+
summary: Classes for analyzing, documenting, and managing Tableau Workbooks.
|
50
|
+
test_files: []
|