imw 0.2.18 → 0.3.0
Sign up to get free protection for your applications and to get access to all the features.
- data/Gemfile +7 -26
- data/Gemfile.lock +13 -38
- data/{LICENSE → LICENSE.txt} +1 -1
- data/README.textile +35 -0
- data/Rakefile +45 -22
- data/VERSION +1 -1
- data/examples/foo.rb +19 -0
- data/examples/html_selector.rb +22 -0
- data/examples/nes_game_list.csv +625 -0
- data/examples/nes_gamespot.csv +1371 -0
- data/examples/nes_nintendo.csv +624 -0
- data/examples/nes_unlicensed.csv +89 -0
- data/examples/nes_wikipedia.csv +710 -0
- data/examples/nibbler_test.rb +24 -0
- data/examples/script.rb +19 -0
- data/lib/imw.rb +28 -140
- data/lib/imw/error.rb +9 -0
- data/lib/imw/recordizer.rb +8 -0
- data/lib/imw/recordizer/html_selector_recordizer.rb +86 -0
- data/lib/imw/recordizer/string_slice_recordizer.rb +39 -0
- data/lib/imw/resource.rb +3 -119
- data/lib/imw/serializer.rb +7 -0
- data/lib/imw/serializer/json_serializer.rb +17 -0
- data/lib/imw/uri.rb +41 -0
- data/spec/resource_spec.rb +78 -0
- data/spec/uri_spec.rb +55 -0
- metadata +81 -232
- data/README.rdoc +0 -371
- data/bin/imw +0 -5
- data/bin/tsv_to_json.rb +0 -29
- data/etc/imwrc.rb +0 -26
- data/examples/dataset.rb +0 -12
- data/examples/metadata.yml +0 -10
- data/lib/imw/archives.rb +0 -120
- data/lib/imw/archives/rar.rb +0 -19
- data/lib/imw/archives/tar.rb +0 -19
- data/lib/imw/archives/tarbz2.rb +0 -73
- data/lib/imw/archives/targz.rb +0 -73
- data/lib/imw/archives/zip.rb +0 -51
- data/lib/imw/boot.rb +0 -87
- data/lib/imw/compressed_files.rb +0 -94
- data/lib/imw/compressed_files/bz2.rb +0 -16
- data/lib/imw/compressed_files/compressible.rb +0 -75
- data/lib/imw/compressed_files/gz.rb +0 -16
- data/lib/imw/dataset.rb +0 -125
- data/lib/imw/dataset/paths.rb +0 -29
- data/lib/imw/dataset/workflow.rb +0 -195
- data/lib/imw/formats.rb +0 -33
- data/lib/imw/formats/delimited.rb +0 -170
- data/lib/imw/formats/excel.rb +0 -100
- data/lib/imw/formats/json.rb +0 -41
- data/lib/imw/formats/pdf.rb +0 -71
- data/lib/imw/formats/sgml.rb +0 -69
- data/lib/imw/formats/yaml.rb +0 -41
- data/lib/imw/metadata.rb +0 -83
- data/lib/imw/metadata/contains_metadata.rb +0 -54
- data/lib/imw/metadata/dsl.rb +0 -111
- data/lib/imw/metadata/field.rb +0 -37
- data/lib/imw/metadata/has_metadata.rb +0 -98
- data/lib/imw/metadata/has_summary.rb +0 -57
- data/lib/imw/metadata/schema.rb +0 -17
- data/lib/imw/parsers.rb +0 -8
- data/lib/imw/parsers/flat.rb +0 -44
- data/lib/imw/parsers/html_parser.rb +0 -387
- data/lib/imw/parsers/html_parser/matchers.rb +0 -289
- data/lib/imw/parsers/line_parser.rb +0 -87
- data/lib/imw/parsers/regexp_parser.rb +0 -72
- data/lib/imw/repository.rb +0 -12
- data/lib/imw/runner.rb +0 -118
- data/lib/imw/schemes.rb +0 -23
- data/lib/imw/schemes/ftp.rb +0 -142
- data/lib/imw/schemes/hdfs.rb +0 -251
- data/lib/imw/schemes/http.rb +0 -165
- data/lib/imw/schemes/local.rb +0 -409
- data/lib/imw/schemes/remote.rb +0 -119
- data/lib/imw/schemes/s3.rb +0 -143
- data/lib/imw/schemes/sql.rb +0 -129
- data/lib/imw/tools.rb +0 -12
- data/lib/imw/tools/aggregator.rb +0 -148
- data/lib/imw/tools/archiver.rb +0 -220
- data/lib/imw/tools/downloader.rb +0 -63
- data/lib/imw/tools/extension_analyzer.rb +0 -114
- data/lib/imw/tools/summarizer.rb +0 -83
- data/lib/imw/tools/transferer.rb +0 -167
- data/lib/imw/utils.rb +0 -74
- data/lib/imw/utils/dynamically_extendable.rb +0 -137
- data/lib/imw/utils/error.rb +0 -59
- data/lib/imw/utils/extensions/hpricot.rb +0 -34
- data/lib/imw/utils/has_uri.rb +0 -131
- data/lib/imw/utils/log.rb +0 -92
- data/lib/imw/utils/misc.rb +0 -57
- data/lib/imw/utils/paths.rb +0 -146
- data/lib/imw/utils/uri.rb +0 -59
- data/lib/imw/utils/uuid.rb +0 -33
- data/lib/imw/utils/validate.rb +0 -38
- data/lib/imw/utils/version.rb +0 -11
- data/spec/data/formats/delimited/sample.csv +0 -131
- data/spec/data/formats/delimited/sample.tsv +0 -131
- data/spec/data/formats/delimited/with_schema/ace-hardware-locations.tsv +0 -11
- data/spec/data/formats/delimited/with_schema/all-countries-ip-address-to-geolocation-data.tsv +0 -16
- data/spec/data/formats/delimited/with_schema/complete-list-of-starbucks-locations.tsv +0 -11
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-cumulative-word-count-from-from-dec.tsv +0 -22
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-myspace-application-adds-by-zip-cod.tsv +0 -22
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-myspace-application-counts.tsv +0 -12
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-user-count-by-latlong.tsv +0 -13
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-user-count-by-zip-code.tsv +0 -22
- data/spec/data/formats/delimited/with_schema/myspace-user-activity-stream-word-count-by-day-from-december-200.tsv +0 -22
- data/spec/data/formats/delimited/without_schema/ace-hardware-locations.tsv +0 -10
- data/spec/data/formats/delimited/without_schema/all-countries-ip-address-to-geolocation-data.tsv +0 -15
- data/spec/data/formats/delimited/without_schema/complete-list-of-starbucks-locations.tsv +0 -10
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-cumulative-word-count-from-from-dec.tsv +0 -21
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-myspace-application-adds-by-zip-cod.tsv +0 -21
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-myspace-application-counts.tsv +0 -11
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-user-count-by-latlong.tsv +0 -12
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-user-count-by-zip-code.tsv +0 -21
- data/spec/data/formats/delimited/without_schema/myspace-user-activity-stream-word-count-by-day-from-december-200.tsv +0 -21
- data/spec/data/formats/excel/sample.xls +0 -0
- data/spec/data/formats/json/sample.json +0 -1
- data/spec/data/formats/none/sample +0 -650
- data/spec/data/formats/sgml/sample.xml +0 -617
- data/spec/data/formats/text/sample.txt +0 -650
- data/spec/data/formats/yaml/sample.yaml +0 -410
- data/spec/data/schema-tabular.yaml +0 -11
- data/spec/imw/archives/rar_spec.rb +0 -16
- data/spec/imw/archives/tar_spec.rb +0 -16
- data/spec/imw/archives/tarbz2_spec.rb +0 -24
- data/spec/imw/archives/targz_spec.rb +0 -21
- data/spec/imw/archives/zip_spec.rb +0 -16
- data/spec/imw/archives_spec.rb +0 -77
- data/spec/imw/compressed_files/bz2_spec.rb +0 -15
- data/spec/imw/compressed_files/compressible_spec.rb +0 -36
- data/spec/imw/compressed_files/gz_spec.rb +0 -15
- data/spec/imw/compressed_files_spec.rb +0 -47
- data/spec/imw/dataset/paths_spec.rb +0 -32
- data/spec/imw/dataset/workflow_spec.rb +0 -41
- data/spec/imw/formats/delimited_spec.rb +0 -44
- data/spec/imw/formats/excel_spec.rb +0 -55
- data/spec/imw/formats/json_spec.rb +0 -18
- data/spec/imw/formats/sgml_spec.rb +0 -24
- data/spec/imw/formats/yaml_spec.rb +0 -19
- data/spec/imw/metadata/contains_metadata_spec.rb +0 -56
- data/spec/imw/metadata/field_spec.rb +0 -25
- data/spec/imw/metadata/has_metadata_spec.rb +0 -58
- data/spec/imw/metadata/has_summary_spec.rb +0 -32
- data/spec/imw/metadata/schema_spec.rb +0 -24
- data/spec/imw/metadata_spec.rb +0 -86
- data/spec/imw/parsers/line_parser_spec.rb +0 -96
- data/spec/imw/parsers/regexp_parser_spec.rb +0 -42
- data/spec/imw/resource_spec.rb +0 -32
- data/spec/imw/schemes/hdfs_spec.rb +0 -67
- data/spec/imw/schemes/http_spec.rb +0 -19
- data/spec/imw/schemes/local_spec.rb +0 -165
- data/spec/imw/schemes/remote_spec.rb +0 -38
- data/spec/imw/schemes/s3_spec.rb +0 -31
- data/spec/imw/schemes/sql_spec.rb +0 -3
- data/spec/imw/tools/aggregator_spec.rb +0 -71
- data/spec/imw/tools/archiver_spec.rb +0 -120
- data/spec/imw/tools/extension_analyzer_spec.rb +0 -153
- data/spec/imw/tools/summarizer_spec.rb +0 -8
- data/spec/imw/tools/transferer_spec.rb +0 -195
- data/spec/imw/utils/dynamically_extendable_spec.rb +0 -69
- data/spec/imw/utils/has_uri_spec.rb +0 -61
- data/spec/imw/utils/paths_spec.rb +0 -10
- data/spec/imw/utils/shared_paths_spec.rb +0 -29
- data/spec/imw_spec.rb +0 -14
- data/spec/rcov.opts +0 -1
- data/spec/spec_helper.rb +0 -31
- data/spec/support/custom_matchers.rb +0 -28
- data/spec/support/file_contents_matcher.rb +0 -30
- data/spec/support/paths_matcher.rb +0 -66
- data/spec/support/random.rb +0 -213
- data/spec/support/without_regard_to_order_matcher.rb +0 -41
data/lib/imw/utils/uuid.rb
DELETED
@@ -1,33 +0,0 @@
|
|
1
|
-
require 'uuidtools'
|
2
|
-
|
3
|
-
class UUID
|
4
|
-
|
5
|
-
#
|
6
|
-
# A string suitable for using as a path name --
|
7
|
-
#
|
8
|
-
# Ex.
|
9
|
-
# urn:uuid:3c0dce44-80a8-11dd-a897-001ff35a0a8b =>
|
10
|
-
# urn_uuid/3c0dce44/80a8/11dd/a897/001ff35a0a8b
|
11
|
-
#
|
12
|
-
# It's well possible there are more perspicacious choices for points to split
|
13
|
-
# the string, but until we hit that limit this'll do.
|
14
|
-
#
|
15
|
-
def to_path
|
16
|
-
'urn_uuid/' + to_s.gsub(/[\:\-]/,'/')
|
17
|
-
end
|
18
|
-
|
19
|
-
def self.hex_to_str str
|
20
|
-
/([\da-f]{8})([\da-f]{4})([\da-f]{4})([\da-f]{4})([\da-f]{12})/.match(str).captures.join '-'
|
21
|
-
end
|
22
|
-
|
23
|
-
|
24
|
-
def self.parse_hex str
|
25
|
-
parse(UUID.hex_to_str(str))
|
26
|
-
end
|
27
|
-
|
28
|
-
# Overrides UUIDTools -- force 32 hex digits (leading zeros)
|
29
|
-
def hexdigest
|
30
|
-
"%032x" % self.to_i
|
31
|
-
end
|
32
|
-
|
33
|
-
end
|
data/lib/imw/utils/validate.rb
DELETED
@@ -1,38 +0,0 @@
|
|
1
|
-
|
2
|
-
|
3
|
-
# Return true if <tt>email</tt> is a valid email address
|
4
|
-
def is_email?(email)
|
5
|
-
raise ArgumentError, "'email' must be a string" if email.class != String
|
6
|
-
return false if email.empty?
|
7
|
-
|
8
|
-
parts = email.split('@')
|
9
|
-
return false if parts.size != 2
|
10
|
-
|
11
|
-
local = parts.first
|
12
|
-
return false if not local =~ /[a-zA-Z0-9_~=+-.]*/ # allowed characters
|
13
|
-
return false if local[0,1] == '.' # starts with .
|
14
|
-
return false if local[-1,1] == '.' # end with .
|
15
|
-
return false if local.include?('..') # can't repeat .
|
16
|
-
|
17
|
-
domain = parts.last
|
18
|
-
return false if not is_domain?(domain)
|
19
|
-
|
20
|
-
return true
|
21
|
-
end
|
22
|
-
|
23
|
-
# Return true if <tt>domain</tt> is a valid domain name
|
24
|
-
def is_domain?(domain)
|
25
|
-
raise ArgumentError, "'domain' must be a string" if domain.class != String
|
26
|
-
return false if domain.empty?
|
27
|
-
|
28
|
-
return false if domain.size > 255 # max number of characters in a domain
|
29
|
-
return false if not domain =~ /^[a-zA-Z0-9.\-]+$/ # allowed characters
|
30
|
-
parts = domain.split('.')
|
31
|
-
return false if parts.size > 127 # max number of subdomains
|
32
|
-
parts.all? {|part| return false if part.size > 63} # max number of characters in a subdomain
|
33
|
-
|
34
|
-
return true
|
35
|
-
end
|
36
|
-
|
37
|
-
|
38
|
-
# puts "#{File.basename(__FILE__)}: As you shape your body to the confines of your container you feel a tremendous sense of validation." # at bottom
|
data/lib/imw/utils/version.rb
DELETED
@@ -1,131 +0,0 @@
|
|
1
|
-
ID,Name,Genus,Species
|
2
|
-
001,Gray-bellied Night Monkey,Aotus,lemurinus
|
3
|
-
002,Panamanian Night Monkey,Aotus,zonalis
|
4
|
-
003,Hernández-Camacho's Night Monkey,Aotus,jorgehernandezi
|
5
|
-
004,Gray-handed Night Monkey,Aotus,griseimembra
|
6
|
-
005,Hershkovitz's Night Monkey,Aotus,hershkovitzi
|
7
|
-
006,Brumback's Night Monkey,Aotus,brumbacki
|
8
|
-
007,Three-striped Night Monkey,Aotus,trivirgatus
|
9
|
-
008,Spix's Night Monkey,Aotus,vociferans
|
10
|
-
009,Malaysian Lar Gibbon,Hylobates,lar lar
|
11
|
-
010,Carpenter's Lar Gibbon,Hylobates,lar carpenteri
|
12
|
-
011,Central Lar Gibbon,Hylobates,lar entelloides
|
13
|
-
012,Sumatran Lar Gibbon,Hylobates,lar vestitus
|
14
|
-
013,Yunnan Lar Gibbon,Hylobates,lar yunnanensis
|
15
|
-
014,Mountain Agile Gibbon,Hylobates,agilis agilis
|
16
|
-
015,Bornean White-bearded Gibbon,Hylobates,agilis albibarbis
|
17
|
-
016,Lowland Agile Gibbon,Hylobates,agilis unko
|
18
|
-
017,Müller's Gray Gibbon,Hylobates,muelleri muelleri
|
19
|
-
018,Abbott's Gray Gibbon,Hylobates,muelleri abbotti
|
20
|
-
019,Northern Gray Gibbon,Hylobates,muelleri funereus
|
21
|
-
020,Black Tamarin,Saguinas,niger
|
22
|
-
021,Black-mantled Tamarin,Saguinas,nigricollis
|
23
|
-
022,Brown-mantled Tamarin,Saguinas,fuscicollis
|
24
|
-
023,Cottontop Tamarin or Pinché Tamarin,Saguinas,oedipus
|
25
|
-
024,Emperor Tamarin,Saguinas,imperator
|
26
|
-
025,Geoffroy's Tamarin,Saguinas,geoffroyi
|
27
|
-
026,Golden-mantled Tamarin,Saguinas,tripartitus
|
28
|
-
027,Graells's Tamarin,Saguinas,graellsi
|
29
|
-
028,Martins's Tamarin,Saguinas,martinsi
|
30
|
-
029,Mottle-faced Tamarin,Saguinas,inustus
|
31
|
-
030,Moustached Tamarin,Saguinas,mystax
|
32
|
-
031,Pied Tamarin,Saguinas,bicolor
|
33
|
-
032,Red-capped Tamarin,Saguinas,pileatus
|
34
|
-
033,Red-handed Tamarin,Saguinas,midas
|
35
|
-
034,White-footed Tamarin,Saguinas,leucopus
|
36
|
-
035,White-lipped Tamarin,Saguinas,labiatus
|
37
|
-
036,White-mantled Tamarin,Saguinas,melanoleucus
|
38
|
-
037,Allen's Swamp Monkey,Allenopithecus,nigroviridis
|
39
|
-
038,Angolan Talapoin,Miopithecus,talapoin
|
40
|
-
039,Gabon Talapoin,Miopithecus,ogouensis
|
41
|
-
040,Patas Monkey,Erythrocebus,patas
|
42
|
-
041,Green Monkey,Chlorocebus,sabaeus
|
43
|
-
042,Grivet,Chlorocebus,aethiops
|
44
|
-
043,Bale Mountains Vervet,Chlorocebus,djamdjamensis
|
45
|
-
044,Tantalus Monkey,Chlorocebus,tantalus
|
46
|
-
045,Vervet Monkey,Chlorocebus,pygerythrus
|
47
|
-
046,Malbrouck,Chlorocebus,cynosuros
|
48
|
-
047,Dryas Monkey or Salongo Monkey,Cercopithecus,dryas
|
49
|
-
048,Diana Monkey,Cercopithecus,diana
|
50
|
-
049,Roloway Monkey,Cercopithecus,roloway
|
51
|
-
050,Greater Spot-nosed Monkey,Cercopithecus,nictitans
|
52
|
-
051,Blue Monkey,Cercopithecus,mitis
|
53
|
-
052,Silver Monkey,Cercopithecus,doggetti
|
54
|
-
053,Golden Monkey,Cercopithecus,kandti
|
55
|
-
054,Sykes's Monkey,Cercopithecus,albogularis
|
56
|
-
055,Mona Monkey,Cercopithecus,mona
|
57
|
-
056,Campbell's Mona Monkey,Cercopithecus,campbelli
|
58
|
-
057,Lowe's Mona Monkey,Cercopithecus,lowei
|
59
|
-
058,Crested Mona Monkey,Cercopithecus,pogonias
|
60
|
-
059,Wolf's Mona Monkey,Cercopithecus,wolfi
|
61
|
-
060,Dent's Mona Monkey,Cercopithecus,denti
|
62
|
-
061,Lesser Spot-nosed Monkey,Cercopithecus,petaurista
|
63
|
-
062,White-throated Guenon,Cercopithecus,erythrogaster
|
64
|
-
063,Sclater's Guenon,Cercopithecus,sclateri
|
65
|
-
064,Red-eared Guenon,Cercopithecus,erythrotis
|
66
|
-
065,Moustached Guenon,Cercopithecus,cephus
|
67
|
-
066,Red-tailed Monkey,Cercopithecus,ascanius
|
68
|
-
067,L'Hoest's Monkey,Cercopithecus,lhoesti
|
69
|
-
068,Preuss's Monkey,Cercopithecus,preussi
|
70
|
-
069,Sun-tailed Monkey,Cercopithecus,solatus
|
71
|
-
070,Hamlyn's Monkey,Cercopithecus,hamlyni
|
72
|
-
071,De Brazza's Monkey,Cercopithecus,neglectus
|
73
|
-
072,Barbary Macaque,Macaca,sylvanus
|
74
|
-
073,Lion-tailed Macaque,Macaca,silenus
|
75
|
-
074,Southern Pig-tailed Macaque or Beruk,Macaca,nemestrina
|
76
|
-
075,Northern Pig-tailed Macaque,Macaca,leonina
|
77
|
-
076,Pagai Island Macaque or Bokkoi,Macaca,pagensis
|
78
|
-
077,Siberut Macaque,Macaca,siberu
|
79
|
-
078,Moor Macaque,Macaca,maura
|
80
|
-
079,Booted Macaque,Macaca,ochreata
|
81
|
-
080,Tonkean Macaque,Macaca,tonkeana
|
82
|
-
081,Heck's Macaque,Macaca,hecki
|
83
|
-
082,Gorontalo Macaque,Macaca,nigrescens
|
84
|
-
083,Celebes Crested Macaque or Black Ape,Macaca,nigra
|
85
|
-
084,Crab-eating Macaque or Long-tailed Macaque or Kera,Macaca,fascicularis
|
86
|
-
085,Stump-tailed Macaque or Bear Macaque,Macaca,arctoides
|
87
|
-
086,Rhesus Macaque,Macaca,mulatta
|
88
|
-
087,Formosan Rock Macaque,Macaca,cyclopis
|
89
|
-
088,Japanese Macaque,Macaca,fuscata
|
90
|
-
089,Toque Macaque,Macaca,sinica
|
91
|
-
090,Bonnet Macaque,Macaca,radiata
|
92
|
-
091,Assam Macaque,Macaca,assamensis
|
93
|
-
092,Tibetan Macaque or Milne-Edwards' Macaque,Macaca,thibetana
|
94
|
-
093,Arunachal Macaque or Munzala,Macaca,munzala
|
95
|
-
094,Grey-cheeked Mangabey,Lophocebus,albigena
|
96
|
-
095,Black Crested Mangabey,Lophocebus,aterrimus
|
97
|
-
096,Opdenbosch's Mangabey,Lophocebus,opdenboschi
|
98
|
-
097,Uganda Mangabey,Lophocebus,ugandae
|
99
|
-
098,Johnston's Mangabey,Lophocebus,johnstoni
|
100
|
-
099,Osman Hill's Mangabey,Lophocebus,osmani
|
101
|
-
100,Kipunji,Rungwecebus,kipunji
|
102
|
-
101,Hamadryas Baboon,Papio,hamadryas
|
103
|
-
102,Guinea Baboon,Papio,papio
|
104
|
-
103,Olive Baboon,Papio,anubis
|
105
|
-
104,Yellow Baboon,Papio,cynocephalus
|
106
|
-
105,Chacma Baboon,Papio,ursinus
|
107
|
-
106,Gelada,Theropithecus,gelada
|
108
|
-
107,Sooty Mangabey,Cercocebus,atys
|
109
|
-
108,Collared Mangabey,Cercocebus,torquatus
|
110
|
-
109,Agile Mangabey,Cercocebus,agilis
|
111
|
-
110,Golden-bellied Mangabey,Cercocebus,chrysogaster
|
112
|
-
111,Tana River Mangabey,Cercocebus,galeritus
|
113
|
-
112,Sanje Mangabey,Cercocebus,sanjei
|
114
|
-
113,Mandrill,Mandrillus,sphinx
|
115
|
-
114,Drill,Mandrillus,leucophaeus
|
116
|
-
115,Black Colobus,Colobus,satanas
|
117
|
-
116,Angola Colobus,Colobus,angolensis
|
118
|
-
117,King Colobus,Colobus,polykomos
|
119
|
-
118,Ursine Colobus,Colobus,vellerosus
|
120
|
-
119,Mantled Guereza,Colobus,guereza
|
121
|
-
120,Western Red Colobus,Piliocolobus,badius
|
122
|
-
121,Pennant's Colobus,Piliocolobus,pennantii
|
123
|
-
122,Preuss's Red Colobus,Piliocolobus,preussi
|
124
|
-
123,Thollon's Red Colobus,Piliocolobus,tholloni
|
125
|
-
124,Central African Red Colobus,Piliocolobus,foai
|
126
|
-
125,Ugandan Red Colobus,Piliocolobus,tephrosceles
|
127
|
-
126,Uzungwa Red Colobus,Piliocolobus,gordonorum
|
128
|
-
127,Zanzibar Red Colobus,Piliocolobus,kirkii
|
129
|
-
128,Tana River Red Colobus,Piliocolobus,rufomitratus
|
130
|
-
129,Olive Colobus,Procolobus,verus
|
131
|
-
130,Maroon Leaf Monkey,Presbytis,rubicunda
|
@@ -1,131 +0,0 @@
|
|
1
|
-
ID Name Genus Species
|
2
|
-
001 Gray-bellied Night Monkey Aotus lemurinus
|
3
|
-
002 Panamanian Night Monkey Aotus zonalis
|
4
|
-
003 Hernández-Camacho's Night Monkey Aotus jorgehernandezi
|
5
|
-
004 Gray-handed Night Monkey Aotus griseimembra
|
6
|
-
005 Hershkovitz's Night Monkey Aotus hershkovitzi
|
7
|
-
006 Brumback's Night Monkey Aotus brumbacki
|
8
|
-
007 Three-striped Night Monkey Aotus trivirgatus
|
9
|
-
008 Spix's Night Monkey Aotus vociferans
|
10
|
-
009 Malaysian Lar Gibbon Hylobates lar lar
|
11
|
-
010 Carpenter's Lar Gibbon Hylobates lar carpenteri
|
12
|
-
011 Central Lar Gibbon Hylobates lar entelloides
|
13
|
-
012 Sumatran Lar Gibbon Hylobates lar vestitus
|
14
|
-
013 Yunnan Lar Gibbon Hylobates lar yunnanensis
|
15
|
-
014 Mountain Agile Gibbon Hylobates agilis agilis
|
16
|
-
015 Bornean White-bearded Gibbon Hylobates agilis albibarbis
|
17
|
-
016 Lowland Agile Gibbon Hylobates agilis unko
|
18
|
-
017 Müller's Gray Gibbon Hylobates muelleri muelleri
|
19
|
-
018 Abbott's Gray Gibbon Hylobates muelleri abbotti
|
20
|
-
019 Northern Gray Gibbon Hylobates muelleri funereus
|
21
|
-
020 Black Tamarin Saguinas niger
|
22
|
-
021 Black-mantled Tamarin Saguinas nigricollis
|
23
|
-
022 Brown-mantled Tamarin Saguinas fuscicollis
|
24
|
-
023 Cottontop Tamarin or Pinché Tamarin Saguinas oedipus
|
25
|
-
024 Emperor Tamarin Saguinas imperator
|
26
|
-
025 Geoffroy's Tamarin Saguinas geoffroyi
|
27
|
-
026 Golden-mantled Tamarin Saguinas tripartitus
|
28
|
-
027 Graells's Tamarin Saguinas graellsi
|
29
|
-
028 Martins's Tamarin Saguinas martinsi
|
30
|
-
029 Mottle-faced Tamarin Saguinas inustus
|
31
|
-
030 Moustached Tamarin Saguinas mystax
|
32
|
-
031 Pied Tamarin Saguinas bicolor
|
33
|
-
032 Red-capped Tamarin Saguinas pileatus
|
34
|
-
033 Red-handed Tamarin Saguinas midas
|
35
|
-
034 White-footed Tamarin Saguinas leucopus
|
36
|
-
035 White-lipped Tamarin Saguinas labiatus
|
37
|
-
036 White-mantled Tamarin Saguinas melanoleucus
|
38
|
-
037 Allen's Swamp Monkey Allenopithecus nigroviridis
|
39
|
-
038 Angolan Talapoin Miopithecus talapoin
|
40
|
-
039 Gabon Talapoin Miopithecus ogouensis
|
41
|
-
040 Patas Monkey Erythrocebus patas
|
42
|
-
041 Green Monkey Chlorocebus sabaeus
|
43
|
-
042 Grivet Chlorocebus aethiops
|
44
|
-
043 Bale Mountains Vervet Chlorocebus djamdjamensis
|
45
|
-
044 Tantalus Monkey Chlorocebus tantalus
|
46
|
-
045 Vervet Monkey Chlorocebus pygerythrus
|
47
|
-
046 Malbrouck Chlorocebus cynosuros
|
48
|
-
047 Dryas Monkey or Salongo Monkey Cercopithecus dryas
|
49
|
-
048 Diana Monkey Cercopithecus diana
|
50
|
-
049 Roloway Monkey Cercopithecus roloway
|
51
|
-
050 Greater Spot-nosed Monkey Cercopithecus nictitans
|
52
|
-
051 Blue Monkey Cercopithecus mitis
|
53
|
-
052 Silver Monkey Cercopithecus doggetti
|
54
|
-
053 Golden Monkey Cercopithecus kandti
|
55
|
-
054 Sykes's Monkey Cercopithecus albogularis
|
56
|
-
055 Mona Monkey Cercopithecus mona
|
57
|
-
056 Campbell's Mona Monkey Cercopithecus campbelli
|
58
|
-
057 Lowe's Mona Monkey Cercopithecus lowei
|
59
|
-
058 Crested Mona Monkey Cercopithecus pogonias
|
60
|
-
059 Wolf's Mona Monkey Cercopithecus wolfi
|
61
|
-
060 Dent's Mona Monkey Cercopithecus denti
|
62
|
-
061 Lesser Spot-nosed Monkey Cercopithecus petaurista
|
63
|
-
062 White-throated Guenon Cercopithecus erythrogaster
|
64
|
-
063 Sclater's Guenon Cercopithecus sclateri
|
65
|
-
064 Red-eared Guenon Cercopithecus erythrotis
|
66
|
-
065 Moustached Guenon Cercopithecus cephus
|
67
|
-
066 Red-tailed Monkey Cercopithecus ascanius
|
68
|
-
067 L'Hoest's Monkey Cercopithecus lhoesti
|
69
|
-
068 Preuss's Monkey Cercopithecus preussi
|
70
|
-
069 Sun-tailed Monkey Cercopithecus solatus
|
71
|
-
070 Hamlyn's Monkey Cercopithecus hamlyni
|
72
|
-
071 De Brazza's Monkey Cercopithecus neglectus
|
73
|
-
072 Barbary Macaque Macaca sylvanus
|
74
|
-
073 Lion-tailed Macaque Macaca silenus
|
75
|
-
074 Southern Pig-tailed Macaque or Beruk Macaca nemestrina
|
76
|
-
075 Northern Pig-tailed Macaque Macaca leonina
|
77
|
-
076 Pagai Island Macaque or Bokkoi Macaca pagensis
|
78
|
-
077 Siberut Macaque Macaca siberu
|
79
|
-
078 Moor Macaque Macaca maura
|
80
|
-
079 Booted Macaque Macaca ochreata
|
81
|
-
080 Tonkean Macaque Macaca tonkeana
|
82
|
-
081 Heck's Macaque Macaca hecki
|
83
|
-
082 Gorontalo Macaque Macaca nigrescens
|
84
|
-
083 Celebes Crested Macaque or Black Ape Macaca nigra
|
85
|
-
084 Crab-eating Macaque or Long-tailed Macaque or Kera Macaca fascicularis
|
86
|
-
085 Stump-tailed Macaque or Bear Macaque Macaca arctoides
|
87
|
-
086 Rhesus Macaque Macaca mulatta
|
88
|
-
087 Formosan Rock Macaque Macaca cyclopis
|
89
|
-
088 Japanese Macaque Macaca fuscata
|
90
|
-
089 Toque Macaque Macaca sinica
|
91
|
-
090 Bonnet Macaque Macaca radiata
|
92
|
-
091 Assam Macaque Macaca assamensis
|
93
|
-
092 Tibetan Macaque or Milne-Edwards' Macaque Macaca thibetana
|
94
|
-
093 Arunachal Macaque or Munzala Macaca munzala
|
95
|
-
094 Grey-cheeked Mangabey Lophocebus albigena
|
96
|
-
095 Black Crested Mangabey Lophocebus aterrimus
|
97
|
-
096 Opdenbosch's Mangabey Lophocebus opdenboschi
|
98
|
-
097 Uganda Mangabey Lophocebus ugandae
|
99
|
-
098 Johnston's Mangabey Lophocebus johnstoni
|
100
|
-
099 Osman Hill's Mangabey Lophocebus osmani
|
101
|
-
100 Kipunji Rungwecebus kipunji
|
102
|
-
101 Hamadryas Baboon Papio hamadryas
|
103
|
-
102 Guinea Baboon Papio papio
|
104
|
-
103 Olive Baboon Papio anubis
|
105
|
-
104 Yellow Baboon Papio cynocephalus
|
106
|
-
105 Chacma Baboon Papio ursinus
|
107
|
-
106 Gelada Theropithecus gelada
|
108
|
-
107 Sooty Mangabey Cercocebus atys
|
109
|
-
108 Collared Mangabey Cercocebus torquatus
|
110
|
-
109 Agile Mangabey Cercocebus agilis
|
111
|
-
110 Golden-bellied Mangabey Cercocebus chrysogaster
|
112
|
-
111 Tana River Mangabey Cercocebus galeritus
|
113
|
-
112 Sanje Mangabey Cercocebus sanjei
|
114
|
-
113 Mandrill Mandrillus sphinx
|
115
|
-
114 Drill Mandrillus leucophaeus
|
116
|
-
115 Black Colobus Colobus satanas
|
117
|
-
116 Angola Colobus Colobus angolensis
|
118
|
-
117 King Colobus Colobus polykomos
|
119
|
-
118 Ursine Colobus Colobus vellerosus
|
120
|
-
119 Mantled Guereza Colobus guereza
|
121
|
-
120 Western Red Colobus Piliocolobus badius
|
122
|
-
121 Pennant's Colobus Piliocolobus pennantii
|
123
|
-
122 Preuss's Red Colobus Piliocolobus preussi
|
124
|
-
123 Thollon's Red Colobus Piliocolobus tholloni
|
125
|
-
124 Central African Red Colobus Piliocolobus foai
|
126
|
-
125 Ugandan Red Colobus Piliocolobus tephrosceles
|
127
|
-
126 Uzungwa Red Colobus Piliocolobus gordonorum
|
128
|
-
127 Zanzibar Red Colobus Piliocolobus kirkii
|
129
|
-
128 Tana River Red Colobus Piliocolobus rufomitratus
|
130
|
-
129 Olive Colobus Procolobus verus
|
131
|
-
130 Maroon Leaf Monkey Presbytis rubicunda
|
@@ -1,11 +0,0 @@
|
|
1
|
-
Store Number Store Name Address City State Zip Phone Number Latitude Longitude
|
2
|
-
10344 Ace Gambles of Hotchkiss 121 E. Bridge Street Hotchkiss CO 81419 (970) 872-3535 38.7988 -107.7205
|
3
|
-
10347 Al's Ace Hardware 4010 E 29th St Tucson AZ 85711 (520) 747-8144 32.1996 -110.9059
|
4
|
-
10349 Al's Ace Hardware 4722 E Broadway Blvd Tucson AZ 85711 (520) 318-0414 32.2216 -110.8916
|
5
|
-
10351 Al's Ace Hardware 2884 N Campbell Ave Tucson AZ 85719 (520) 325-2432 32.259 -110.9428
|
6
|
-
10353 Lewistown Ace Hardware 815 NE Main St Lewistown MT 59457 (406) 538-4000 47.0702 -109.409
|
7
|
-
10356 Byram Revell Ace Hardware 5726 Terry Rd Jackson MS 39272 (601) 371-8429 32.1919 -90.2542
|
8
|
-
10357 Mr C's Ace Hardware 1201 Precinct Line Rd Hurst TX 76053 (817) 282-3428 32.831 -97.186
|
9
|
-
10358 Gus Bock Ace Hardware 3455 Ridge Rd Lansing IL 60438 (708) 474-5940 41.5643 -87.5321
|
10
|
-
10359 Elberton Ace Hardware 886 Elbert St Elberton GA 30635 (706) 283-3054 34.1008 -82.8495
|
11
|
-
10361 Phil's Hardware 13 SW H St Madras OR 97741 (541) 475-9392 44.627737 -121.13004
|
data/spec/data/formats/delimited/with_schema/all-countries-ip-address-to-geolocation-data.tsv
DELETED
@@ -1,16 +0,0 @@
|
|
1
|
-
IP_BeginNum IP_EndNum IP_SubBlock IP_Begin IP_End Country State City ZipCode Latitude Longitude MetroCode AreaCode
|
2
|
-
16777216 16842751 256 1.0.0.0 1.0.255.255 AP 35.0 105.0
|
3
|
-
16842752 16908287 257 1.1.0.0 1.1.255.255 AP 35.0 105.0
|
4
|
-
16908288 16973823 258 1.2.0.0 1.2.255.255 AP 35.0 105.0
|
5
|
-
16973824 17039359 259 1.3.0.0 1.3.255.255 AP 35.0 105.0
|
6
|
-
17039360 17104895 260 1.4.0.0 1.4.255.255 AP 35.0 105.0
|
7
|
-
17104896 17170431 261 1.5.0.0 1.5.255.255 AP 35.0 105.0
|
8
|
-
17170432 17235967 262 1.6.0.0 1.6.255.255 AP 35.0 105.0
|
9
|
-
17235968 17301503 263 1.7.0.0 1.7.255.255 AP 35.0 105.0
|
10
|
-
17301504 17367039 264 1.8.0.0 1.8.255.255 AP 35.0 105.0
|
11
|
-
17367040 17432575 265 1.9.0.0 1.9.255.255 AP 35.0 105.0
|
12
|
-
17432576 17498111 266 1.10.0.0 1.10.255.255 AP 35.0 105.0
|
13
|
-
17498112 17563647 267 1.11.0.0 1.11.255.255 AP 35.0 105.0
|
14
|
-
17563648 17629183 268 1.12.0.0 1.12.255.255 AP 35.0 105.0
|
15
|
-
17629184 17694719 269 1.13.0.0 1.13.255.255 AP 35.0 105.0
|
16
|
-
17694720 17760255 270 1.14.0.0 1.14.255.255 AP 35.0 105.0
|
@@ -1,11 +0,0 @@
|
|
1
|
-
Store Number Store Name Address City State Zip Phone Wireless Latitude Longitude
|
2
|
-
103704 Grand & Reems, Surprise 18885 N. Reems Road - #105 Surprise AZ 85374 623-584-5015 wireless 33.646084 -112.389903
|
3
|
-
98887 Safeway-Sun City West #1520 14505 W Grand Ave Surprise AZ 85374 623-975-4022 33.655002 -112.371358
|
4
|
-
97730 Safeway-Surprise #1997 17049 W Bell Rd Surprise AZ 85374 623-518-1059 33.638805 -112.42561
|
5
|
-
97179 Safeway-Surprise #2699 13828 W Waddell Rd Surprise AZ 85374 623-476-1810 33.609216 -112.357999
|
6
|
-
23371 Albertsons-Tempe AZ #940 750 E Guadalupe Rd Tempe AZ 85283 480-820-8166 33.364742 -111.92974
|
7
|
-
78041 Aramark ASU Bookstore 525 E. Orange St. Tempe AZ 85287 480-727-0830 33.418367 -111.931272
|
8
|
-
78040 Aramark ASU Business College College of Business 1st Floor Tempe AZ 85287 480-727-0019 33.4148 -111.9088
|
9
|
-
78022 Aramark ASU Memorial Union 2090 S Normal Tempe AZ 85287 480-727-7480 33.416721 -111.933296
|
10
|
-
94352 Aramark ASU Palo Verde East 340 E University Dr Tempe AZ 85287 480-727-0462 33.421975 -111.934342
|
11
|
-
1417 Arizona Mills 5000 Arizona Mills Circle - Suite #391 Tempe AZ 85282 (480) 897-4804 wireless 33.379419 -111.965053
|
@@ -1,22 +0,0 @@
|
|
1
|
-
Word Count
|
2
|
-
accaldata 4
|
3
|
-
accaldato 4
|
4
|
-
accalia 124
|
5
|
-
accallonato 2
|
6
|
-
accally 3
|
7
|
-
accalmie 5
|
8
|
-
accaly 4
|
9
|
-
accampato 2
|
10
|
-
accanimento 2
|
11
|
-
accanisce 4
|
12
|
-
accaniti 4
|
13
|
-
accanito 3
|
14
|
-
accannate 3
|
15
|
-
accannato 3
|
16
|
-
accant 8
|
17
|
-
accanto 135
|
18
|
-
accantonate 2
|
19
|
-
accaount 7
|
20
|
-
accapalla 3
|
21
|
-
accapar 6
|
22
|
-
accape 2
|
@@ -1,22 +0,0 @@
|
|
1
|
-
ZIP Code Application Count
|
2
|
-
10000 Dragon Wars 9
|
3
|
-
10000 SuperPoke Pets 179
|
4
|
-
10000 Dancing Bananas_ 75
|
5
|
-
10000 digitck 1
|
6
|
-
10000 Random Friend Viewer 56
|
7
|
-
10000 Daily Horoscope 1
|
8
|
-
10000 FARKLE 30
|
9
|
-
10000 Chat 12
|
10
|
-
10000 Hero World 47
|
11
|
-
10000 PinkRibbon 7
|
12
|
-
10000 Super Slot Machines 47
|
13
|
-
10000 RSS Reader 5
|
14
|
-
10000 SexGames 36
|
15
|
-
10001 Astrology 18
|
16
|
-
10001 Rockstars 3
|
17
|
-
10001 Movies 50
|
18
|
-
10001 Green Spot 30
|
19
|
-
10001 RockYou Pets 95
|
20
|
-
10001 Tag Me 1415
|
21
|
-
10001 Nitrous Racing 18
|
22
|
-
10001 Baby Animals Dressup Tiger 3
|
@@ -1,12 +0,0 @@
|
|
1
|
-
Application Count
|
2
|
-
Addicted to Xena 13
|
3
|
-
Addicted to Zoey 101 4
|
4
|
-
Addicting Games - Free Kicker 3
|
5
|
-
Addiction 10
|
6
|
-
Adopt A Pet 176
|
7
|
-
Adopt a Friend 660
|
8
|
-
Adorable Pet Chinchilla 64
|
9
|
-
Adorable Puppies 32
|
10
|
-
Adorable Twins 7
|
11
|
-
Adorninho against the Tsunami 1
|
12
|
-
Adrenaline Challenge 30
|