imw 0.2.18 → 0.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/Gemfile +7 -26
- data/Gemfile.lock +13 -38
- data/{LICENSE → LICENSE.txt} +1 -1
- data/README.textile +35 -0
- data/Rakefile +45 -22
- data/VERSION +1 -1
- data/examples/foo.rb +19 -0
- data/examples/html_selector.rb +22 -0
- data/examples/nes_game_list.csv +625 -0
- data/examples/nes_gamespot.csv +1371 -0
- data/examples/nes_nintendo.csv +624 -0
- data/examples/nes_unlicensed.csv +89 -0
- data/examples/nes_wikipedia.csv +710 -0
- data/examples/nibbler_test.rb +24 -0
- data/examples/script.rb +19 -0
- data/lib/imw.rb +28 -140
- data/lib/imw/error.rb +9 -0
- data/lib/imw/recordizer.rb +8 -0
- data/lib/imw/recordizer/html_selector_recordizer.rb +86 -0
- data/lib/imw/recordizer/string_slice_recordizer.rb +39 -0
- data/lib/imw/resource.rb +3 -119
- data/lib/imw/serializer.rb +7 -0
- data/lib/imw/serializer/json_serializer.rb +17 -0
- data/lib/imw/uri.rb +41 -0
- data/spec/resource_spec.rb +78 -0
- data/spec/uri_spec.rb +55 -0
- metadata +81 -232
- data/README.rdoc +0 -371
- data/bin/imw +0 -5
- data/bin/tsv_to_json.rb +0 -29
- data/etc/imwrc.rb +0 -26
- data/examples/dataset.rb +0 -12
- data/examples/metadata.yml +0 -10
- data/lib/imw/archives.rb +0 -120
- data/lib/imw/archives/rar.rb +0 -19
- data/lib/imw/archives/tar.rb +0 -19
- data/lib/imw/archives/tarbz2.rb +0 -73
- data/lib/imw/archives/targz.rb +0 -73
- data/lib/imw/archives/zip.rb +0 -51
- data/lib/imw/boot.rb +0 -87
- data/lib/imw/compressed_files.rb +0 -94
- data/lib/imw/compressed_files/bz2.rb +0 -16
- data/lib/imw/compressed_files/compressible.rb +0 -75
- data/lib/imw/compressed_files/gz.rb +0 -16
- data/lib/imw/dataset.rb +0 -125
- data/lib/imw/dataset/paths.rb +0 -29
- data/lib/imw/dataset/workflow.rb +0 -195
- data/lib/imw/formats.rb +0 -33
- data/lib/imw/formats/delimited.rb +0 -170
- data/lib/imw/formats/excel.rb +0 -100
- data/lib/imw/formats/json.rb +0 -41
- data/lib/imw/formats/pdf.rb +0 -71
- data/lib/imw/formats/sgml.rb +0 -69
- data/lib/imw/formats/yaml.rb +0 -41
- data/lib/imw/metadata.rb +0 -83
- data/lib/imw/metadata/contains_metadata.rb +0 -54
- data/lib/imw/metadata/dsl.rb +0 -111
- data/lib/imw/metadata/field.rb +0 -37
- data/lib/imw/metadata/has_metadata.rb +0 -98
- data/lib/imw/metadata/has_summary.rb +0 -57
- data/lib/imw/metadata/schema.rb +0 -17
- data/lib/imw/parsers.rb +0 -8
- data/lib/imw/parsers/flat.rb +0 -44
- data/lib/imw/parsers/html_parser.rb +0 -387
- data/lib/imw/parsers/html_parser/matchers.rb +0 -289
- data/lib/imw/parsers/line_parser.rb +0 -87
- data/lib/imw/parsers/regexp_parser.rb +0 -72
- data/lib/imw/repository.rb +0 -12
- data/lib/imw/runner.rb +0 -118
- data/lib/imw/schemes.rb +0 -23
- data/lib/imw/schemes/ftp.rb +0 -142
- data/lib/imw/schemes/hdfs.rb +0 -251
- data/lib/imw/schemes/http.rb +0 -165
- data/lib/imw/schemes/local.rb +0 -409
- data/lib/imw/schemes/remote.rb +0 -119
- data/lib/imw/schemes/s3.rb +0 -143
- data/lib/imw/schemes/sql.rb +0 -129
- data/lib/imw/tools.rb +0 -12
- data/lib/imw/tools/aggregator.rb +0 -148
- data/lib/imw/tools/archiver.rb +0 -220
- data/lib/imw/tools/downloader.rb +0 -63
- data/lib/imw/tools/extension_analyzer.rb +0 -114
- data/lib/imw/tools/summarizer.rb +0 -83
- data/lib/imw/tools/transferer.rb +0 -167
- data/lib/imw/utils.rb +0 -74
- data/lib/imw/utils/dynamically_extendable.rb +0 -137
- data/lib/imw/utils/error.rb +0 -59
- data/lib/imw/utils/extensions/hpricot.rb +0 -34
- data/lib/imw/utils/has_uri.rb +0 -131
- data/lib/imw/utils/log.rb +0 -92
- data/lib/imw/utils/misc.rb +0 -57
- data/lib/imw/utils/paths.rb +0 -146
- data/lib/imw/utils/uri.rb +0 -59
- data/lib/imw/utils/uuid.rb +0 -33
- data/lib/imw/utils/validate.rb +0 -38
- data/lib/imw/utils/version.rb +0 -11
- data/spec/data/formats/delimited/sample.csv +0 -131
- data/spec/data/formats/delimited/sample.tsv +0 -131
- data/spec/data/formats/delimited/with_schema/ace-hardware-locations.tsv +0 -11
- data/spec/data/formats/delimited/with_schema/all-countries-ip-address-to-geolocation-data.tsv +0 -16
- data/spec/data/formats/delimited/with_schema/complete-list-of-starbucks-locations.tsv +0 -11
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-cumulative-word-count-from-from-dec.tsv +0 -22
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-myspace-application-adds-by-zip-cod.tsv +0 -22
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-myspace-application-counts.tsv +0 -12
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-user-count-by-latlong.tsv +0 -13
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-user-count-by-zip-code.tsv +0 -22
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-word-count-by-day-from-december-200.tsv +0 -22
- data/spec/data/formats/delimited/without_schema/ace-hardware-locations.tsv +0 -10
- data/spec/data/formats/delimited/without_schema/all-countries-ip-address-to-geolocation-data.tsv +0 -15
- data/spec/data/formats/delimited/without_schema/complete-list-of-starbucks-locations.tsv +0 -10
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-cumulative-word-count-from-from-dec.tsv +0 -21
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-myspace-application-adds-by-zip-cod.tsv +0 -21
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-myspace-application-counts.tsv +0 -11
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-user-count-by-latlong.tsv +0 -12
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-user-count-by-zip-code.tsv +0 -21
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-word-count-by-day-from-december-200.tsv +0 -21
- data/spec/data/formats/excel/sample.xls +0 -0
- data/spec/data/formats/json/sample.json +0 -1
- data/spec/data/formats/none/sample +0 -650
- data/spec/data/formats/sgml/sample.xml +0 -617
- data/spec/data/formats/text/sample.txt +0 -650
- data/spec/data/formats/yaml/sample.yaml +0 -410
- data/spec/data/schema-tabular.yaml +0 -11
- data/spec/imw/archives/rar_spec.rb +0 -16
- data/spec/imw/archives/tar_spec.rb +0 -16
- data/spec/imw/archives/tarbz2_spec.rb +0 -24
- data/spec/imw/archives/targz_spec.rb +0 -21
- data/spec/imw/archives/zip_spec.rb +0 -16
- data/spec/imw/archives_spec.rb +0 -77
- data/spec/imw/compressed_files/bz2_spec.rb +0 -15
- data/spec/imw/compressed_files/compressible_spec.rb +0 -36
- data/spec/imw/compressed_files/gz_spec.rb +0 -15
- data/spec/imw/compressed_files_spec.rb +0 -47
- data/spec/imw/dataset/paths_spec.rb +0 -32
- data/spec/imw/dataset/workflow_spec.rb +0 -41
- data/spec/imw/formats/delimited_spec.rb +0 -44
- data/spec/imw/formats/excel_spec.rb +0 -55
- data/spec/imw/formats/json_spec.rb +0 -18
- data/spec/imw/formats/sgml_spec.rb +0 -24
- data/spec/imw/formats/yaml_spec.rb +0 -19
- data/spec/imw/metadata/contains_metadata_spec.rb +0 -56
- data/spec/imw/metadata/field_spec.rb +0 -25
- data/spec/imw/metadata/has_metadata_spec.rb +0 -58
- data/spec/imw/metadata/has_summary_spec.rb +0 -32
- data/spec/imw/metadata/schema_spec.rb +0 -24
- data/spec/imw/metadata_spec.rb +0 -86
- data/spec/imw/parsers/line_parser_spec.rb +0 -96
- data/spec/imw/parsers/regexp_parser_spec.rb +0 -42
- data/spec/imw/resource_spec.rb +0 -32
- data/spec/imw/schemes/hdfs_spec.rb +0 -67
- data/spec/imw/schemes/http_spec.rb +0 -19
- data/spec/imw/schemes/local_spec.rb +0 -165
- data/spec/imw/schemes/remote_spec.rb +0 -38
- data/spec/imw/schemes/s3_spec.rb +0 -31
- data/spec/imw/schemes/sql_spec.rb +0 -3
- data/spec/imw/tools/aggregator_spec.rb +0 -71
- data/spec/imw/tools/archiver_spec.rb +0 -120
- data/spec/imw/tools/extension_analyzer_spec.rb +0 -153
- data/spec/imw/tools/summarizer_spec.rb +0 -8
- data/spec/imw/tools/transferer_spec.rb +0 -195
- data/spec/imw/utils/dynamically_extendable_spec.rb +0 -69
- data/spec/imw/utils/has_uri_spec.rb +0 -61
- data/spec/imw/utils/paths_spec.rb +0 -10
- data/spec/imw/utils/shared_paths_spec.rb +0 -29
- data/spec/imw_spec.rb +0 -14
- data/spec/rcov.opts +0 -1
- data/spec/spec_helper.rb +0 -31
- data/spec/support/custom_matchers.rb +0 -28
- data/spec/support/file_contents_matcher.rb +0 -30
- data/spec/support/paths_matcher.rb +0 -66
- data/spec/support/random.rb +0 -213
- data/spec/support/without_regard_to_order_matcher.rb +0 -41
data/lib/imw/utils/uuid.rb
DELETED
|
@@ -1,33 +0,0 @@
|
|
|
1
|
-
require 'uuidtools'
|
|
2
|
-
|
|
3
|
-
class UUID
|
|
4
|
-
|
|
5
|
-
#
|
|
6
|
-
# A string suitable for using as a path name --
|
|
7
|
-
#
|
|
8
|
-
# Ex.
|
|
9
|
-
# urn:uuid:3c0dce44-80a8-11dd-a897-001ff35a0a8b =>
|
|
10
|
-
# urn_uuid/3c0dce44/80a8/11dd/a897/001ff35a0a8b
|
|
11
|
-
#
|
|
12
|
-
# It's well possible there are more perspicacious choices for points to split
|
|
13
|
-
# the string, but until we hit that limit this'll do.
|
|
14
|
-
#
|
|
15
|
-
def to_path
|
|
16
|
-
'urn_uuid/' + to_s.gsub(/[\:\-]/,'/')
|
|
17
|
-
end
|
|
18
|
-
|
|
19
|
-
def self.hex_to_str str
|
|
20
|
-
/([\da-f]{8})([\da-f]{4})([\da-f]{4})([\da-f]{4})([\da-f]{12})/.match(str).captures.join '-'
|
|
21
|
-
end
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
def self.parse_hex str
|
|
25
|
-
parse(UUID.hex_to_str(str))
|
|
26
|
-
end
|
|
27
|
-
|
|
28
|
-
# Overrides UUIDTools -- force 32 hex digits (leading zeros)
|
|
29
|
-
def hexdigest
|
|
30
|
-
"%032x" % self.to_i
|
|
31
|
-
end
|
|
32
|
-
|
|
33
|
-
end
|
data/lib/imw/utils/validate.rb
DELETED
|
@@ -1,38 +0,0 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
3
|
-
# Return true if <tt>email</tt> is a valid email address
|
|
4
|
-
def is_email?(email)
|
|
5
|
-
raise ArgumentError, "'email' must be a string" if email.class != String
|
|
6
|
-
return false if email.empty?
|
|
7
|
-
|
|
8
|
-
parts = email.split('@')
|
|
9
|
-
return false if parts.size != 2
|
|
10
|
-
|
|
11
|
-
local = parts.first
|
|
12
|
-
return false if not local =~ /[a-zA-Z0-9_~=+-.]*/ # allowed characters
|
|
13
|
-
return false if local[0,1] == '.' # starts with .
|
|
14
|
-
return false if local[-1,1] == '.' # end with .
|
|
15
|
-
return false if local.include?('..') # can't repeat .
|
|
16
|
-
|
|
17
|
-
domain = parts.last
|
|
18
|
-
return false if not is_domain?(domain)
|
|
19
|
-
|
|
20
|
-
return true
|
|
21
|
-
end
|
|
22
|
-
|
|
23
|
-
# Return true if <tt>domain</tt> is a valid domain name
|
|
24
|
-
def is_domain?(domain)
|
|
25
|
-
raise ArgumentError, "'domain' must be a string" if domain.class != String
|
|
26
|
-
return false if domain.empty?
|
|
27
|
-
|
|
28
|
-
return false if domain.size > 255 # max number of characters in a domain
|
|
29
|
-
return false if not domain =~ /^[a-zA-Z0-9.\-]+$/ # allowed characters
|
|
30
|
-
parts = domain.split('.')
|
|
31
|
-
return false if parts.size > 127 # max number of subdomains
|
|
32
|
-
parts.all? {|part| return false if part.size > 63} # max number of characters in a subdomain
|
|
33
|
-
|
|
34
|
-
return true
|
|
35
|
-
end
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
# puts "#{File.basename(__FILE__)}: As you shape your body to the confines of your container you feel a tremendous sense of validation." # at bottom
|
data/lib/imw/utils/version.rb
DELETED
|
@@ -1,131 +0,0 @@
|
|
|
1
|
-
ID,Name,Genus,Species
|
|
2
|
-
001,Gray-bellied Night Monkey,Aotus,lemurinus
|
|
3
|
-
002,Panamanian Night Monkey,Aotus,zonalis
|
|
4
|
-
003,Hernández-Camacho's Night Monkey,Aotus,jorgehernandezi
|
|
5
|
-
004,Gray-handed Night Monkey,Aotus,griseimembra
|
|
6
|
-
005,Hershkovitz's Night Monkey,Aotus,hershkovitzi
|
|
7
|
-
006,Brumback's Night Monkey,Aotus,brumbacki
|
|
8
|
-
007,Three-striped Night Monkey,Aotus,trivirgatus
|
|
9
|
-
008,Spix's Night Monkey,Aotus,vociferans
|
|
10
|
-
009,Malaysian Lar Gibbon,Hylobates,lar lar
|
|
11
|
-
010,Carpenter's Lar Gibbon,Hylobates,lar carpenteri
|
|
12
|
-
011,Central Lar Gibbon,Hylobates,lar entelloides
|
|
13
|
-
012,Sumatran Lar Gibbon,Hylobates,lar vestitus
|
|
14
|
-
013,Yunnan Lar Gibbon,Hylobates,lar yunnanensis
|
|
15
|
-
014,Mountain Agile Gibbon,Hylobates,agilis agilis
|
|
16
|
-
015,Bornean White-bearded Gibbon,Hylobates,agilis albibarbis
|
|
17
|
-
016,Lowland Agile Gibbon,Hylobates,agilis unko
|
|
18
|
-
017,Müller's Gray Gibbon,Hylobates,muelleri muelleri
|
|
19
|
-
018,Abbott's Gray Gibbon,Hylobates,muelleri abbotti
|
|
20
|
-
019,Northern Gray Gibbon,Hylobates,muelleri funereus
|
|
21
|
-
020,Black Tamarin,Saguinas,niger
|
|
22
|
-
021,Black-mantled Tamarin,Saguinas,nigricollis
|
|
23
|
-
022,Brown-mantled Tamarin,Saguinas,fuscicollis
|
|
24
|
-
023,Cottontop Tamarin or Pinché Tamarin,Saguinas,oedipus
|
|
25
|
-
024,Emperor Tamarin,Saguinas,imperator
|
|
26
|
-
025,Geoffroy's Tamarin,Saguinas,geoffroyi
|
|
27
|
-
026,Golden-mantled Tamarin,Saguinas,tripartitus
|
|
28
|
-
027,Graells's Tamarin,Saguinas,graellsi
|
|
29
|
-
028,Martins's Tamarin,Saguinas,martinsi
|
|
30
|
-
029,Mottle-faced Tamarin,Saguinas,inustus
|
|
31
|
-
030,Moustached Tamarin,Saguinas,mystax
|
|
32
|
-
031,Pied Tamarin,Saguinas,bicolor
|
|
33
|
-
032,Red-capped Tamarin,Saguinas,pileatus
|
|
34
|
-
033,Red-handed Tamarin,Saguinas,midas
|
|
35
|
-
034,White-footed Tamarin,Saguinas,leucopus
|
|
36
|
-
035,White-lipped Tamarin,Saguinas,labiatus
|
|
37
|
-
036,White-mantled Tamarin,Saguinas,melanoleucus
|
|
38
|
-
037,Allen's Swamp Monkey,Allenopithecus,nigroviridis
|
|
39
|
-
038,Angolan Talapoin,Miopithecus,talapoin
|
|
40
|
-
039,Gabon Talapoin,Miopithecus,ogouensis
|
|
41
|
-
040,Patas Monkey,Erythrocebus,patas
|
|
42
|
-
041,Green Monkey,Chlorocebus,sabaeus
|
|
43
|
-
042,Grivet,Chlorocebus,aethiops
|
|
44
|
-
043,Bale Mountains Vervet,Chlorocebus,djamdjamensis
|
|
45
|
-
044,Tantalus Monkey,Chlorocebus,tantalus
|
|
46
|
-
045,Vervet Monkey,Chlorocebus,pygerythrus
|
|
47
|
-
046,Malbrouck,Chlorocebus,cynosuros
|
|
48
|
-
047,Dryas Monkey or Salongo Monkey,Cercopithecus,dryas
|
|
49
|
-
048,Diana Monkey,Cercopithecus,diana
|
|
50
|
-
049,Roloway Monkey,Cercopithecus,roloway
|
|
51
|
-
050,Greater Spot-nosed Monkey,Cercopithecus,nictitans
|
|
52
|
-
051,Blue Monkey,Cercopithecus,mitis
|
|
53
|
-
052,Silver Monkey,Cercopithecus,doggetti
|
|
54
|
-
053,Golden Monkey,Cercopithecus,kandti
|
|
55
|
-
054,Sykes's Monkey,Cercopithecus,albogularis
|
|
56
|
-
055,Mona Monkey,Cercopithecus,mona
|
|
57
|
-
056,Campbell's Mona Monkey,Cercopithecus,campbelli
|
|
58
|
-
057,Lowe's Mona Monkey,Cercopithecus,lowei
|
|
59
|
-
058,Crested Mona Monkey,Cercopithecus,pogonias
|
|
60
|
-
059,Wolf's Mona Monkey,Cercopithecus,wolfi
|
|
61
|
-
060,Dent's Mona Monkey,Cercopithecus,denti
|
|
62
|
-
061,Lesser Spot-nosed Monkey,Cercopithecus,petaurista
|
|
63
|
-
062,White-throated Guenon,Cercopithecus,erythrogaster
|
|
64
|
-
063,Sclater's Guenon,Cercopithecus,sclateri
|
|
65
|
-
064,Red-eared Guenon,Cercopithecus,erythrotis
|
|
66
|
-
065,Moustached Guenon,Cercopithecus,cephus
|
|
67
|
-
066,Red-tailed Monkey,Cercopithecus,ascanius
|
|
68
|
-
067,L'Hoest's Monkey,Cercopithecus,lhoesti
|
|
69
|
-
068,Preuss's Monkey,Cercopithecus,preussi
|
|
70
|
-
069,Sun-tailed Monkey,Cercopithecus,solatus
|
|
71
|
-
070,Hamlyn's Monkey,Cercopithecus,hamlyni
|
|
72
|
-
071,De Brazza's Monkey,Cercopithecus,neglectus
|
|
73
|
-
072,Barbary Macaque,Macaca,sylvanus
|
|
74
|
-
073,Lion-tailed Macaque,Macaca,silenus
|
|
75
|
-
074,Southern Pig-tailed Macaque or Beruk,Macaca,nemestrina
|
|
76
|
-
075,Northern Pig-tailed Macaque,Macaca,leonina
|
|
77
|
-
076,Pagai Island Macaque or Bokkoi,Macaca,pagensis
|
|
78
|
-
077,Siberut Macaque,Macaca,siberu
|
|
79
|
-
078,Moor Macaque,Macaca,maura
|
|
80
|
-
079,Booted Macaque,Macaca,ochreata
|
|
81
|
-
080,Tonkean Macaque,Macaca,tonkeana
|
|
82
|
-
081,Heck's Macaque,Macaca,hecki
|
|
83
|
-
082,Gorontalo Macaque,Macaca,nigrescens
|
|
84
|
-
083,Celebes Crested Macaque or Black Ape,Macaca,nigra
|
|
85
|
-
084,Crab-eating Macaque or Long-tailed Macaque or Kera,Macaca,fascicularis
|
|
86
|
-
085,Stump-tailed Macaque or Bear Macaque,Macaca,arctoides
|
|
87
|
-
086,Rhesus Macaque,Macaca,mulatta
|
|
88
|
-
087,Formosan Rock Macaque,Macaca,cyclopis
|
|
89
|
-
088,Japanese Macaque,Macaca,fuscata
|
|
90
|
-
089,Toque Macaque,Macaca,sinica
|
|
91
|
-
090,Bonnet Macaque,Macaca,radiata
|
|
92
|
-
091,Assam Macaque,Macaca,assamensis
|
|
93
|
-
092,Tibetan Macaque or Milne-Edwards' Macaque,Macaca,thibetana
|
|
94
|
-
093,Arunachal Macaque or Munzala,Macaca,munzala
|
|
95
|
-
094,Grey-cheeked Mangabey,Lophocebus,albigena
|
|
96
|
-
095,Black Crested Mangabey,Lophocebus,aterrimus
|
|
97
|
-
096,Opdenbosch's Mangabey,Lophocebus,opdenboschi
|
|
98
|
-
097,Uganda Mangabey,Lophocebus,ugandae
|
|
99
|
-
098,Johnston's Mangabey,Lophocebus,johnstoni
|
|
100
|
-
099,Osman Hill's Mangabey,Lophocebus,osmani
|
|
101
|
-
100,Kipunji,Rungwecebus,kipunji
|
|
102
|
-
101,Hamadryas Baboon,Papio,hamadryas
|
|
103
|
-
102,Guinea Baboon,Papio,papio
|
|
104
|
-
103,Olive Baboon,Papio,anubis
|
|
105
|
-
104,Yellow Baboon,Papio,cynocephalus
|
|
106
|
-
105,Chacma Baboon,Papio,ursinus
|
|
107
|
-
106,Gelada,Theropithecus,gelada
|
|
108
|
-
107,Sooty Mangabey,Cercocebus,atys
|
|
109
|
-
108,Collared Mangabey,Cercocebus,torquatus
|
|
110
|
-
109,Agile Mangabey,Cercocebus,agilis
|
|
111
|
-
110,Golden-bellied Mangabey,Cercocebus,chrysogaster
|
|
112
|
-
111,Tana River Mangabey,Cercocebus,galeritus
|
|
113
|
-
112,Sanje Mangabey,Cercocebus,sanjei
|
|
114
|
-
113,Mandrill,Mandrillus,sphinx
|
|
115
|
-
114,Drill,Mandrillus,leucophaeus
|
|
116
|
-
115,Black Colobus,Colobus,satanas
|
|
117
|
-
116,Angola Colobus,Colobus,angolensis
|
|
118
|
-
117,King Colobus,Colobus,polykomos
|
|
119
|
-
118,Ursine Colobus,Colobus,vellerosus
|
|
120
|
-
119,Mantled Guereza,Colobus,guereza
|
|
121
|
-
120,Western Red Colobus,Piliocolobus,badius
|
|
122
|
-
121,Pennant's Colobus,Piliocolobus,pennantii
|
|
123
|
-
122,Preuss's Red Colobus,Piliocolobus,preussi
|
|
124
|
-
123,Thollon's Red Colobus,Piliocolobus,tholloni
|
|
125
|
-
124,Central African Red Colobus,Piliocolobus,foai
|
|
126
|
-
125,Ugandan Red Colobus,Piliocolobus,tephrosceles
|
|
127
|
-
126,Uzungwa Red Colobus,Piliocolobus,gordonorum
|
|
128
|
-
127,Zanzibar Red Colobus,Piliocolobus,kirkii
|
|
129
|
-
128,Tana River Red Colobus,Piliocolobus,rufomitratus
|
|
130
|
-
129,Olive Colobus,Procolobus,verus
|
|
131
|
-
130,Maroon Leaf Monkey,Presbytis,rubicunda
|
|
@@ -1,131 +0,0 @@
|
|
|
1
|
-
ID Name Genus Species
|
|
2
|
-
001 Gray-bellied Night Monkey Aotus lemurinus
|
|
3
|
-
002 Panamanian Night Monkey Aotus zonalis
|
|
4
|
-
003 Hernández-Camacho's Night Monkey Aotus jorgehernandezi
|
|
5
|
-
004 Gray-handed Night Monkey Aotus griseimembra
|
|
6
|
-
005 Hershkovitz's Night Monkey Aotus hershkovitzi
|
|
7
|
-
006 Brumback's Night Monkey Aotus brumbacki
|
|
8
|
-
007 Three-striped Night Monkey Aotus trivirgatus
|
|
9
|
-
008 Spix's Night Monkey Aotus vociferans
|
|
10
|
-
009 Malaysian Lar Gibbon Hylobates lar lar
|
|
11
|
-
010 Carpenter's Lar Gibbon Hylobates lar carpenteri
|
|
12
|
-
011 Central Lar Gibbon Hylobates lar entelloides
|
|
13
|
-
012 Sumatran Lar Gibbon Hylobates lar vestitus
|
|
14
|
-
013 Yunnan Lar Gibbon Hylobates lar yunnanensis
|
|
15
|
-
014 Mountain Agile Gibbon Hylobates agilis agilis
|
|
16
|
-
015 Bornean White-bearded Gibbon Hylobates agilis albibarbis
|
|
17
|
-
016 Lowland Agile Gibbon Hylobates agilis unko
|
|
18
|
-
017 Müller's Gray Gibbon Hylobates muelleri muelleri
|
|
19
|
-
018 Abbott's Gray Gibbon Hylobates muelleri abbotti
|
|
20
|
-
019 Northern Gray Gibbon Hylobates muelleri funereus
|
|
21
|
-
020 Black Tamarin Saguinas niger
|
|
22
|
-
021 Black-mantled Tamarin Saguinas nigricollis
|
|
23
|
-
022 Brown-mantled Tamarin Saguinas fuscicollis
|
|
24
|
-
023 Cottontop Tamarin or Pinché Tamarin Saguinas oedipus
|
|
25
|
-
024 Emperor Tamarin Saguinas imperator
|
|
26
|
-
025 Geoffroy's Tamarin Saguinas geoffroyi
|
|
27
|
-
026 Golden-mantled Tamarin Saguinas tripartitus
|
|
28
|
-
027 Graells's Tamarin Saguinas graellsi
|
|
29
|
-
028 Martins's Tamarin Saguinas martinsi
|
|
30
|
-
029 Mottle-faced Tamarin Saguinas inustus
|
|
31
|
-
030 Moustached Tamarin Saguinas mystax
|
|
32
|
-
031 Pied Tamarin Saguinas bicolor
|
|
33
|
-
032 Red-capped Tamarin Saguinas pileatus
|
|
34
|
-
033 Red-handed Tamarin Saguinas midas
|
|
35
|
-
034 White-footed Tamarin Saguinas leucopus
|
|
36
|
-
035 White-lipped Tamarin Saguinas labiatus
|
|
37
|
-
036 White-mantled Tamarin Saguinas melanoleucus
|
|
38
|
-
037 Allen's Swamp Monkey Allenopithecus nigroviridis
|
|
39
|
-
038 Angolan Talapoin Miopithecus talapoin
|
|
40
|
-
039 Gabon Talapoin Miopithecus ogouensis
|
|
41
|
-
040 Patas Monkey Erythrocebus patas
|
|
42
|
-
041 Green Monkey Chlorocebus sabaeus
|
|
43
|
-
042 Grivet Chlorocebus aethiops
|
|
44
|
-
043 Bale Mountains Vervet Chlorocebus djamdjamensis
|
|
45
|
-
044 Tantalus Monkey Chlorocebus tantalus
|
|
46
|
-
045 Vervet Monkey Chlorocebus pygerythrus
|
|
47
|
-
046 Malbrouck Chlorocebus cynosuros
|
|
48
|
-
047 Dryas Monkey or Salongo Monkey Cercopithecus dryas
|
|
49
|
-
048 Diana Monkey Cercopithecus diana
|
|
50
|
-
049 Roloway Monkey Cercopithecus roloway
|
|
51
|
-
050 Greater Spot-nosed Monkey Cercopithecus nictitans
|
|
52
|
-
051 Blue Monkey Cercopithecus mitis
|
|
53
|
-
052 Silver Monkey Cercopithecus doggetti
|
|
54
|
-
053 Golden Monkey Cercopithecus kandti
|
|
55
|
-
054 Sykes's Monkey Cercopithecus albogularis
|
|
56
|
-
055 Mona Monkey Cercopithecus mona
|
|
57
|
-
056 Campbell's Mona Monkey Cercopithecus campbelli
|
|
58
|
-
057 Lowe's Mona Monkey Cercopithecus lowei
|
|
59
|
-
058 Crested Mona Monkey Cercopithecus pogonias
|
|
60
|
-
059 Wolf's Mona Monkey Cercopithecus wolfi
|
|
61
|
-
060 Dent's Mona Monkey Cercopithecus denti
|
|
62
|
-
061 Lesser Spot-nosed Monkey Cercopithecus petaurista
|
|
63
|
-
062 White-throated Guenon Cercopithecus erythrogaster
|
|
64
|
-
063 Sclater's Guenon Cercopithecus sclateri
|
|
65
|
-
064 Red-eared Guenon Cercopithecus erythrotis
|
|
66
|
-
065 Moustached Guenon Cercopithecus cephus
|
|
67
|
-
066 Red-tailed Monkey Cercopithecus ascanius
|
|
68
|
-
067 L'Hoest's Monkey Cercopithecus lhoesti
|
|
69
|
-
068 Preuss's Monkey Cercopithecus preussi
|
|
70
|
-
069 Sun-tailed Monkey Cercopithecus solatus
|
|
71
|
-
070 Hamlyn's Monkey Cercopithecus hamlyni
|
|
72
|
-
071 De Brazza's Monkey Cercopithecus neglectus
|
|
73
|
-
072 Barbary Macaque Macaca sylvanus
|
|
74
|
-
073 Lion-tailed Macaque Macaca silenus
|
|
75
|
-
074 Southern Pig-tailed Macaque or Beruk Macaca nemestrina
|
|
76
|
-
075 Northern Pig-tailed Macaque Macaca leonina
|
|
77
|
-
076 Pagai Island Macaque or Bokkoi Macaca pagensis
|
|
78
|
-
077 Siberut Macaque Macaca siberu
|
|
79
|
-
078 Moor Macaque Macaca maura
|
|
80
|
-
079 Booted Macaque Macaca ochreata
|
|
81
|
-
080 Tonkean Macaque Macaca tonkeana
|
|
82
|
-
081 Heck's Macaque Macaca hecki
|
|
83
|
-
082 Gorontalo Macaque Macaca nigrescens
|
|
84
|
-
083 Celebes Crested Macaque or Black Ape Macaca nigra
|
|
85
|
-
084 Crab-eating Macaque or Long-tailed Macaque or Kera Macaca fascicularis
|
|
86
|
-
085 Stump-tailed Macaque or Bear Macaque Macaca arctoides
|
|
87
|
-
086 Rhesus Macaque Macaca mulatta
|
|
88
|
-
087 Formosan Rock Macaque Macaca cyclopis
|
|
89
|
-
088 Japanese Macaque Macaca fuscata
|
|
90
|
-
089 Toque Macaque Macaca sinica
|
|
91
|
-
090 Bonnet Macaque Macaca radiata
|
|
92
|
-
091 Assam Macaque Macaca assamensis
|
|
93
|
-
092 Tibetan Macaque or Milne-Edwards' Macaque Macaca thibetana
|
|
94
|
-
093 Arunachal Macaque or Munzala Macaca munzala
|
|
95
|
-
094 Grey-cheeked Mangabey Lophocebus albigena
|
|
96
|
-
095 Black Crested Mangabey Lophocebus aterrimus
|
|
97
|
-
096 Opdenbosch's Mangabey Lophocebus opdenboschi
|
|
98
|
-
097 Uganda Mangabey Lophocebus ugandae
|
|
99
|
-
098 Johnston's Mangabey Lophocebus johnstoni
|
|
100
|
-
099 Osman Hill's Mangabey Lophocebus osmani
|
|
101
|
-
100 Kipunji Rungwecebus kipunji
|
|
102
|
-
101 Hamadryas Baboon Papio hamadryas
|
|
103
|
-
102 Guinea Baboon Papio papio
|
|
104
|
-
103 Olive Baboon Papio anubis
|
|
105
|
-
104 Yellow Baboon Papio cynocephalus
|
|
106
|
-
105 Chacma Baboon Papio ursinus
|
|
107
|
-
106 Gelada Theropithecus gelada
|
|
108
|
-
107 Sooty Mangabey Cercocebus atys
|
|
109
|
-
108 Collared Mangabey Cercocebus torquatus
|
|
110
|
-
109 Agile Mangabey Cercocebus agilis
|
|
111
|
-
110 Golden-bellied Mangabey Cercocebus chrysogaster
|
|
112
|
-
111 Tana River Mangabey Cercocebus galeritus
|
|
113
|
-
112 Sanje Mangabey Cercocebus sanjei
|
|
114
|
-
113 Mandrill Mandrillus sphinx
|
|
115
|
-
114 Drill Mandrillus leucophaeus
|
|
116
|
-
115 Black Colobus Colobus satanas
|
|
117
|
-
116 Angola Colobus Colobus angolensis
|
|
118
|
-
117 King Colobus Colobus polykomos
|
|
119
|
-
118 Ursine Colobus Colobus vellerosus
|
|
120
|
-
119 Mantled Guereza Colobus guereza
|
|
121
|
-
120 Western Red Colobus Piliocolobus badius
|
|
122
|
-
121 Pennant's Colobus Piliocolobus pennantii
|
|
123
|
-
122 Preuss's Red Colobus Piliocolobus preussi
|
|
124
|
-
123 Thollon's Red Colobus Piliocolobus tholloni
|
|
125
|
-
124 Central African Red Colobus Piliocolobus foai
|
|
126
|
-
125 Ugandan Red Colobus Piliocolobus tephrosceles
|
|
127
|
-
126 Uzungwa Red Colobus Piliocolobus gordonorum
|
|
128
|
-
127 Zanzibar Red Colobus Piliocolobus kirkii
|
|
129
|
-
128 Tana River Red Colobus Piliocolobus rufomitratus
|
|
130
|
-
129 Olive Colobus Procolobus verus
|
|
131
|
-
130 Maroon Leaf Monkey Presbytis rubicunda
|
|
@@ -1,11 +0,0 @@
|
|
|
1
|
-
Store Number Store Name Address City State Zip Phone Number Latitude Longitude
|
|
2
|
-
10344 Ace Gambles of Hotchkiss 121 E. Bridge Street Hotchkiss CO 81419 (970) 872-3535 38.7988 -107.7205
|
|
3
|
-
10347 Al's Ace Hardware 4010 E 29th St Tucson AZ 85711 (520) 747-8144 32.1996 -110.9059
|
|
4
|
-
10349 Al's Ace Hardware 4722 E Broadway Blvd Tucson AZ 85711 (520) 318-0414 32.2216 -110.8916
|
|
5
|
-
10351 Al's Ace Hardware 2884 N Campbell Ave Tucson AZ 85719 (520) 325-2432 32.259 -110.9428
|
|
6
|
-
10353 Lewistown Ace Hardware 815 NE Main St Lewistown MT 59457 (406) 538-4000 47.0702 -109.409
|
|
7
|
-
10356 Byram Revell Ace Hardware 5726 Terry Rd Jackson MS 39272 (601) 371-8429 32.1919 -90.2542
|
|
8
|
-
10357 Mr C's Ace Hardware 1201 Precinct Line Rd Hurst TX 76053 (817) 282-3428 32.831 -97.186
|
|
9
|
-
10358 Gus Bock Ace Hardware 3455 Ridge Rd Lansing IL 60438 (708) 474-5940 41.5643 -87.5321
|
|
10
|
-
10359 Elberton Ace Hardware 886 Elbert St Elberton GA 30635 (706) 283-3054 34.1008 -82.8495
|
|
11
|
-
10361 Phil's Hardware 13 SW H St Madras OR 97741 (541) 475-9392 44.627737 -121.13004
|
data/spec/data/formats/delimited/with_schema/all-countries-ip-address-to-geolocation-data.tsv
DELETED
|
@@ -1,16 +0,0 @@
|
|
|
1
|
-
IP_BeginNum IP_EndNum IP_SubBlock IP_Begin IP_End Country State City ZipCode Latitude Longitude MetroCode AreaCode
|
|
2
|
-
16777216 16842751 256 1.0.0.0 1.0.255.255 AP 35.0 105.0
|
|
3
|
-
16842752 16908287 257 1.1.0.0 1.1.255.255 AP 35.0 105.0
|
|
4
|
-
16908288 16973823 258 1.2.0.0 1.2.255.255 AP 35.0 105.0
|
|
5
|
-
16973824 17039359 259 1.3.0.0 1.3.255.255 AP 35.0 105.0
|
|
6
|
-
17039360 17104895 260 1.4.0.0 1.4.255.255 AP 35.0 105.0
|
|
7
|
-
17104896 17170431 261 1.5.0.0 1.5.255.255 AP 35.0 105.0
|
|
8
|
-
17170432 17235967 262 1.6.0.0 1.6.255.255 AP 35.0 105.0
|
|
9
|
-
17235968 17301503 263 1.7.0.0 1.7.255.255 AP 35.0 105.0
|
|
10
|
-
17301504 17367039 264 1.8.0.0 1.8.255.255 AP 35.0 105.0
|
|
11
|
-
17367040 17432575 265 1.9.0.0 1.9.255.255 AP 35.0 105.0
|
|
12
|
-
17432576 17498111 266 1.10.0.0 1.10.255.255 AP 35.0 105.0
|
|
13
|
-
17498112 17563647 267 1.11.0.0 1.11.255.255 AP 35.0 105.0
|
|
14
|
-
17563648 17629183 268 1.12.0.0 1.12.255.255 AP 35.0 105.0
|
|
15
|
-
17629184 17694719 269 1.13.0.0 1.13.255.255 AP 35.0 105.0
|
|
16
|
-
17694720 17760255 270 1.14.0.0 1.14.255.255 AP 35.0 105.0
|
|
@@ -1,11 +0,0 @@
|
|
|
1
|
-
Store Number Store Name Address City State Zip Phone Wireless Latitude Longitude
|
|
2
|
-
103704 Grand & Reems, Surprise 18885 N. Reems Road - #105 Surprise AZ 85374 623-584-5015 wireless 33.646084 -112.389903
|
|
3
|
-
98887 Safeway-Sun City West #1520 14505 W Grand Ave Surprise AZ 85374 623-975-4022 33.655002 -112.371358
|
|
4
|
-
97730 Safeway-Surprise #1997 17049 W Bell Rd Surprise AZ 85374 623-518-1059 33.638805 -112.42561
|
|
5
|
-
97179 Safeway-Surprise #2699 13828 W Waddell Rd Surprise AZ 85374 623-476-1810 33.609216 -112.357999
|
|
6
|
-
23371 Albertsons-Tempe AZ #940 750 E Guadalupe Rd Tempe AZ 85283 480-820-8166 33.364742 -111.92974
|
|
7
|
-
78041 Aramark ASU Bookstore 525 E. Orange St. Tempe AZ 85287 480-727-0830 33.418367 -111.931272
|
|
8
|
-
78040 Aramark ASU Business College College of Business 1st Floor Tempe AZ 85287 480-727-0019 33.4148 -111.9088
|
|
9
|
-
78022 Aramark ASU Memorial Union 2090 S Normal Tempe AZ 85287 480-727-7480 33.416721 -111.933296
|
|
10
|
-
94352 Aramark ASU Palo Verde East 340 E University Dr Tempe AZ 85287 480-727-0462 33.421975 -111.934342
|
|
11
|
-
1417 Arizona Mills 5000 Arizona Mills Circle - Suite #391 Tempe AZ 85282 (480) 897-4804 wireless 33.379419 -111.965053
|
|
@@ -1,22 +0,0 @@
|
|
|
1
|
-
Word Count
|
|
2
|
-
accaldata 4
|
|
3
|
-
accaldato 4
|
|
4
|
-
accalia 124
|
|
5
|
-
accallonato 2
|
|
6
|
-
accally 3
|
|
7
|
-
accalmie 5
|
|
8
|
-
accaly 4
|
|
9
|
-
accampato 2
|
|
10
|
-
accanimento 2
|
|
11
|
-
accanisce 4
|
|
12
|
-
accaniti 4
|
|
13
|
-
accanito 3
|
|
14
|
-
accannate 3
|
|
15
|
-
accannato 3
|
|
16
|
-
accant 8
|
|
17
|
-
accanto 135
|
|
18
|
-
accantonate 2
|
|
19
|
-
accaount 7
|
|
20
|
-
accapalla 3
|
|
21
|
-
accapar 6
|
|
22
|
-
accape 2
|
|
@@ -1,22 +0,0 @@
|
|
|
1
|
-
ZIP Code Application Count
|
|
2
|
-
10000 Dragon Wars 9
|
|
3
|
-
10000 SuperPoke Pets 179
|
|
4
|
-
10000 Dancing Bananas_ 75
|
|
5
|
-
10000 digitck 1
|
|
6
|
-
10000 Random Friend Viewer 56
|
|
7
|
-
10000 Daily Horoscope 1
|
|
8
|
-
10000 FARKLE 30
|
|
9
|
-
10000 Chat 12
|
|
10
|
-
10000 Hero World 47
|
|
11
|
-
10000 PinkRibbon 7
|
|
12
|
-
10000 Super Slot Machines 47
|
|
13
|
-
10000 RSS Reader 5
|
|
14
|
-
10000 SexGames 36
|
|
15
|
-
10001 Astrology 18
|
|
16
|
-
10001 Rockstars 3
|
|
17
|
-
10001 Movies 50
|
|
18
|
-
10001 Green Spot 30
|
|
19
|
-
10001 RockYou Pets 95
|
|
20
|
-
10001 Tag Me 1415
|
|
21
|
-
10001 Nitrous Racing 18
|
|
22
|
-
10001 Baby Animals Dressup Tiger 3
|
|
@@ -1,12 +0,0 @@
|
|
|
1
|
-
Application Count
|
|
2
|
-
Addicted to Xena 13
|
|
3
|
-
Addicted to Zoey 101 4
|
|
4
|
-
Addicting Games - Free Kicker 3
|
|
5
|
-
Addiction 10
|
|
6
|
-
Adopt A Pet 176
|
|
7
|
-
Adopt a Friend 660
|
|
8
|
-
Adorable Pet Chinchilla 64
|
|
9
|
-
Adorable Puppies 32
|
|
10
|
-
Adorable Twins 7
|
|
11
|
-
Adorninho against the Tsunami 1
|
|
12
|
-
Adrenaline Challenge 30
|