anystyle 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (82) hide show
  1. checksums.yaml +7 -0
  2. data/HISTORY.md +78 -0
  3. data/LICENSE +27 -0
  4. data/README.md +103 -0
  5. data/lib/anystyle.rb +71 -0
  6. data/lib/anystyle/dictionary.rb +132 -0
  7. data/lib/anystyle/dictionary/gdbm.rb +52 -0
  8. data/lib/anystyle/dictionary/lmdb.rb +67 -0
  9. data/lib/anystyle/dictionary/marshal.rb +27 -0
  10. data/lib/anystyle/dictionary/redis.rb +55 -0
  11. data/lib/anystyle/document.rb +264 -0
  12. data/lib/anystyle/errors.rb +14 -0
  13. data/lib/anystyle/feature.rb +27 -0
  14. data/lib/anystyle/feature/affix.rb +43 -0
  15. data/lib/anystyle/feature/brackets.rb +32 -0
  16. data/lib/anystyle/feature/canonical.rb +13 -0
  17. data/lib/anystyle/feature/caps.rb +20 -0
  18. data/lib/anystyle/feature/category.rb +70 -0
  19. data/lib/anystyle/feature/dictionary.rb +16 -0
  20. data/lib/anystyle/feature/indent.rb +16 -0
  21. data/lib/anystyle/feature/keyword.rb +52 -0
  22. data/lib/anystyle/feature/line.rb +39 -0
  23. data/lib/anystyle/feature/locator.rb +18 -0
  24. data/lib/anystyle/feature/number.rb +39 -0
  25. data/lib/anystyle/feature/position.rb +28 -0
  26. data/lib/anystyle/feature/punctuation.rb +22 -0
  27. data/lib/anystyle/feature/quotes.rb +20 -0
  28. data/lib/anystyle/feature/ref.rb +21 -0
  29. data/lib/anystyle/feature/terminal.rb +19 -0
  30. data/lib/anystyle/feature/words.rb +74 -0
  31. data/lib/anystyle/finder.rb +94 -0
  32. data/lib/anystyle/format/bibtex.rb +63 -0
  33. data/lib/anystyle/format/csl.rb +28 -0
  34. data/lib/anystyle/normalizer.rb +65 -0
  35. data/lib/anystyle/normalizer/brackets.rb +13 -0
  36. data/lib/anystyle/normalizer/container.rb +13 -0
  37. data/lib/anystyle/normalizer/date.rb +109 -0
  38. data/lib/anystyle/normalizer/edition.rb +16 -0
  39. data/lib/anystyle/normalizer/journal.rb +14 -0
  40. data/lib/anystyle/normalizer/locale.rb +30 -0
  41. data/lib/anystyle/normalizer/location.rb +24 -0
  42. data/lib/anystyle/normalizer/locator.rb +22 -0
  43. data/lib/anystyle/normalizer/names.rb +88 -0
  44. data/lib/anystyle/normalizer/page.rb +29 -0
  45. data/lib/anystyle/normalizer/publisher.rb +18 -0
  46. data/lib/anystyle/normalizer/pubmed.rb +18 -0
  47. data/lib/anystyle/normalizer/punctuation.rb +23 -0
  48. data/lib/anystyle/normalizer/quotes.rb +14 -0
  49. data/lib/anystyle/normalizer/type.rb +54 -0
  50. data/lib/anystyle/normalizer/volume.rb +26 -0
  51. data/lib/anystyle/parser.rb +199 -0
  52. data/lib/anystyle/support.rb +4 -0
  53. data/lib/anystyle/support/finder.mod +3234 -0
  54. data/lib/anystyle/support/finder.txt +75 -0
  55. data/lib/anystyle/support/parser.mod +15025 -0
  56. data/lib/anystyle/support/parser.txt +75 -0
  57. data/lib/anystyle/utils.rb +70 -0
  58. data/lib/anystyle/version.rb +3 -0
  59. data/res/finder/bb132pr2055.ttx +6803 -0
  60. data/res/finder/bb550sh8053.ttx +18660 -0
  61. data/res/finder/bb599nz4341.ttx +2957 -0
  62. data/res/finder/bb725rt6501.ttx +15276 -0
  63. data/res/finder/bc605xz1554.ttx +18815 -0
  64. data/res/finder/bd040gx5718.ttx +4271 -0
  65. data/res/finder/bd413nt2715.ttx +4956 -0
  66. data/res/finder/bd466fq0394.ttx +6100 -0
  67. data/res/finder/bf668vw2021.ttx +3578 -0
  68. data/res/finder/bg495cx0468.ttx +7267 -0
  69. data/res/finder/bg599vt3743.ttx +6752 -0
  70. data/res/finder/bg608dx2253.ttx +4094 -0
  71. data/res/finder/bh410qk3771.ttx +8785 -0
  72. data/res/finder/bh989ww6442.ttx +17204 -0
  73. data/res/finder/bj581pc8202.ttx +2719 -0
  74. data/res/parser/bad.xml +5199 -0
  75. data/res/parser/core.xml +7924 -0
  76. data/res/parser/gold.xml +2707 -0
  77. data/res/parser/good.xml +34281 -0
  78. data/res/parser/stanford-books.xml +2280 -0
  79. data/res/parser/stanford-diss.xml +726 -0
  80. data/res/parser/stanford-theses.xml +4684 -0
  81. data/res/parser/ugly.xml +33246 -0
  82. metadata +195 -0
metadata ADDED
@@ -0,0 +1,195 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: anystyle
3
+ version: !ruby/object:Gem::Version
4
+ version: 1.0.0
5
+ platform: ruby
6
+ authors:
7
+ - Sylvester Keil
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2018-06-06 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: bibtex-ruby
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - "~>"
18
+ - !ruby/object:Gem::Version
19
+ version: '4.0'
20
+ type: :runtime
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - "~>"
25
+ - !ruby/object:Gem::Version
26
+ version: '4.0'
27
+ - !ruby/object:Gem::Dependency
28
+ name: anystyle-data
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - "~>"
32
+ - !ruby/object:Gem::Version
33
+ version: '1.2'
34
+ type: :runtime
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - "~>"
39
+ - !ruby/object:Gem::Version
40
+ version: '1.2'
41
+ - !ruby/object:Gem::Dependency
42
+ name: wapiti
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - "~>"
46
+ - !ruby/object:Gem::Version
47
+ version: '1.0'
48
+ - - ">="
49
+ - !ruby/object:Gem::Version
50
+ version: 1.0.2
51
+ type: :runtime
52
+ prerelease: false
53
+ version_requirements: !ruby/object:Gem::Requirement
54
+ requirements:
55
+ - - "~>"
56
+ - !ruby/object:Gem::Version
57
+ version: '1.0'
58
+ - - ">="
59
+ - !ruby/object:Gem::Version
60
+ version: 1.0.2
61
+ - !ruby/object:Gem::Dependency
62
+ name: namae
63
+ requirement: !ruby/object:Gem::Requirement
64
+ requirements:
65
+ - - "~>"
66
+ - !ruby/object:Gem::Version
67
+ version: '1.0'
68
+ type: :runtime
69
+ prerelease: false
70
+ version_requirements: !ruby/object:Gem::Requirement
71
+ requirements:
72
+ - - "~>"
73
+ - !ruby/object:Gem::Version
74
+ version: '1.0'
75
+ description: A sophisticated parser for academic reference lists and bibliographies
76
+ based on machine learning algorithms using conditional random fields.
77
+ email:
78
+ - http://sylvester.keil.or.at
79
+ executables: []
80
+ extensions: []
81
+ extra_rdoc_files:
82
+ - README.md
83
+ - LICENSE
84
+ files:
85
+ - HISTORY.md
86
+ - LICENSE
87
+ - README.md
88
+ - lib/anystyle.rb
89
+ - lib/anystyle/dictionary.rb
90
+ - lib/anystyle/dictionary/gdbm.rb
91
+ - lib/anystyle/dictionary/lmdb.rb
92
+ - lib/anystyle/dictionary/marshal.rb
93
+ - lib/anystyle/dictionary/redis.rb
94
+ - lib/anystyle/document.rb
95
+ - lib/anystyle/errors.rb
96
+ - lib/anystyle/feature.rb
97
+ - lib/anystyle/feature/affix.rb
98
+ - lib/anystyle/feature/brackets.rb
99
+ - lib/anystyle/feature/canonical.rb
100
+ - lib/anystyle/feature/caps.rb
101
+ - lib/anystyle/feature/category.rb
102
+ - lib/anystyle/feature/dictionary.rb
103
+ - lib/anystyle/feature/indent.rb
104
+ - lib/anystyle/feature/keyword.rb
105
+ - lib/anystyle/feature/line.rb
106
+ - lib/anystyle/feature/locator.rb
107
+ - lib/anystyle/feature/number.rb
108
+ - lib/anystyle/feature/position.rb
109
+ - lib/anystyle/feature/punctuation.rb
110
+ - lib/anystyle/feature/quotes.rb
111
+ - lib/anystyle/feature/ref.rb
112
+ - lib/anystyle/feature/terminal.rb
113
+ - lib/anystyle/feature/words.rb
114
+ - lib/anystyle/finder.rb
115
+ - lib/anystyle/format/bibtex.rb
116
+ - lib/anystyle/format/csl.rb
117
+ - lib/anystyle/normalizer.rb
118
+ - lib/anystyle/normalizer/brackets.rb
119
+ - lib/anystyle/normalizer/container.rb
120
+ - lib/anystyle/normalizer/date.rb
121
+ - lib/anystyle/normalizer/edition.rb
122
+ - lib/anystyle/normalizer/journal.rb
123
+ - lib/anystyle/normalizer/locale.rb
124
+ - lib/anystyle/normalizer/location.rb
125
+ - lib/anystyle/normalizer/locator.rb
126
+ - lib/anystyle/normalizer/names.rb
127
+ - lib/anystyle/normalizer/page.rb
128
+ - lib/anystyle/normalizer/publisher.rb
129
+ - lib/anystyle/normalizer/pubmed.rb
130
+ - lib/anystyle/normalizer/punctuation.rb
131
+ - lib/anystyle/normalizer/quotes.rb
132
+ - lib/anystyle/normalizer/type.rb
133
+ - lib/anystyle/normalizer/volume.rb
134
+ - lib/anystyle/parser.rb
135
+ - lib/anystyle/support.rb
136
+ - lib/anystyle/support/finder.mod
137
+ - lib/anystyle/support/finder.txt
138
+ - lib/anystyle/support/parser.mod
139
+ - lib/anystyle/support/parser.txt
140
+ - lib/anystyle/utils.rb
141
+ - lib/anystyle/version.rb
142
+ - res/finder/bb132pr2055.ttx
143
+ - res/finder/bb550sh8053.ttx
144
+ - res/finder/bb599nz4341.ttx
145
+ - res/finder/bb725rt6501.ttx
146
+ - res/finder/bc605xz1554.ttx
147
+ - res/finder/bd040gx5718.ttx
148
+ - res/finder/bd413nt2715.ttx
149
+ - res/finder/bd466fq0394.ttx
150
+ - res/finder/bf668vw2021.ttx
151
+ - res/finder/bg495cx0468.ttx
152
+ - res/finder/bg599vt3743.ttx
153
+ - res/finder/bg608dx2253.ttx
154
+ - res/finder/bh410qk3771.ttx
155
+ - res/finder/bh989ww6442.ttx
156
+ - res/finder/bj581pc8202.ttx
157
+ - res/parser/bad.xml
158
+ - res/parser/core.xml
159
+ - res/parser/gold.xml
160
+ - res/parser/good.xml
161
+ - res/parser/stanford-books.xml
162
+ - res/parser/stanford-diss.xml
163
+ - res/parser/stanford-theses.xml
164
+ - res/parser/ugly.xml
165
+ homepage: http://anystyle.io
166
+ licenses:
167
+ - BSD-2-Clause
168
+ metadata: {}
169
+ post_install_message:
170
+ rdoc_options:
171
+ - "--line-numbers"
172
+ - "--inline-source"
173
+ - "--title"
174
+ - '"AnyStyle"'
175
+ - "--main"
176
+ - README.md
177
+ require_paths:
178
+ - lib
179
+ required_ruby_version: !ruby/object:Gem::Requirement
180
+ requirements:
181
+ - - ">="
182
+ - !ruby/object:Gem::Version
183
+ version: '2.2'
184
+ required_rubygems_version: !ruby/object:Gem::Requirement
185
+ requirements:
186
+ - - ">="
187
+ - !ruby/object:Gem::Version
188
+ version: '0'
189
+ requirements: []
190
+ rubyforge_project:
191
+ rubygems_version: 2.7.4
192
+ signing_key:
193
+ specification_version: 4
194
+ summary: Smart and fast bibliography parser.
195
+ test_files: []