nlpir 0.0.4-x86-mingw32
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/.gitignore +17 -0
- data/LICENSE.txt +22 -0
- data/README.md +195 -0
- data/Rakefile +11 -0
- data/bin/NLPIR.dll +0 -0
- data/lib/Data/BIG2GBK.map +0 -0
- data/lib/Data/BIG5.pdat +0 -0
- data/lib/Data/BIG5.wordlist +0 -0
- data/lib/Data/BiWord.big +0 -0
- data/lib/Data/Configure.xml +15 -0
- data/lib/Data/CoreDict.pdat +0 -0
- data/lib/Data/CoreDict.pos +0 -0
- data/lib/Data/CoreDict.unig +0 -0
- data/lib/Data/FieldDict.pdat +0 -0
- data/lib/Data/FieldDict.pos +0 -0
- data/lib/Data/GBK.pdat +0 -0
- data/lib/Data/GBK.wordlist +0 -0
- data/lib/Data/GBK2BIG.map +0 -0
- data/lib/Data/GBK2GBKC.map +0 -0
- data/lib/Data/GBK2UTF.map +0 -0
- data/lib/Data/GBKA.pdat +0 -0
- data/lib/Data/GBKA.wordlist +0 -0
- data/lib/Data/GBKA2UTF.map +0 -0
- data/lib/Data/GBKC.pdat +0 -0
- data/lib/Data/GBKC.wordlist +0 -0
- data/lib/Data/GBKC2GBK.map +0 -0
- data/lib/Data/GranDict.pdat +3369 -8
- data/lib/Data/GranDict.pos +0 -0
- data/lib/Data/ICTPOS.map +96 -0
- data/lib/Data/NLPIR.ctx +0 -0
- data/lib/Data/NLPIR.user +0 -0
- data/lib/Data/NLPIR_First.map +96 -0
- data/lib/Data/NewWord.lst +25 -0
- data/lib/Data/PKU.map +96 -0
- data/lib/Data/PKU_First.map +96 -0
- data/lib/Data/UTF2GBK.map +0 -0
- data/lib/Data/UTF2GBKA.map +0 -0
- data/lib/Data/UTF8.pdat +0 -0
- data/lib/Data/UTF8.wordlist +0 -0
- data/lib/Data/UserDict.pdat +0 -0
- data/lib/Data/charset.type +0 -0
- data/lib/Data/nr.ctx +0 -0
- data/lib/Data/nr.fsa +0 -0
- data/lib/Data/nr.role +0 -0
- data/lib/nlpir/version.rb +3 -0
- data/lib/nlpir.rb +275 -0
- data/nlpir.gemspec +25 -0
- data/test/Data/BIG2GBK.map +0 -0
- data/test/Data/BIG5.pdat +0 -0
- data/test/Data/BIG5.wordlist +0 -0
- data/test/Data/BiWord.big +0 -0
- data/test/Data/Configure.xml +15 -0
- data/test/Data/CoreDict.pdat +0 -0
- data/test/Data/CoreDict.pos +0 -0
- data/test/Data/CoreDict.unig +0 -0
- data/test/Data/FieldDict.pdat +0 -0
- data/test/Data/FieldDict.pos +0 -0
- data/test/Data/GBK.pdat +0 -0
- data/test/Data/GBK.wordlist +0 -0
- data/test/Data/GBK2BIG.map +0 -0
- data/test/Data/GBK2GBKC.map +0 -0
- data/test/Data/GBK2UTF.map +0 -0
- data/test/Data/GBKA.pdat +0 -0
- data/test/Data/GBKA.wordlist +0 -0
- data/test/Data/GBKA2UTF.map +0 -0
- data/test/Data/GBKC.pdat +0 -0
- data/test/Data/GBKC.wordlist +0 -0
- data/test/Data/GBKC2GBK.map +0 -0
- data/test/Data/GranDict.pdat +3369 -8
- data/test/Data/GranDict.pos +0 -0
- data/test/Data/ICTPOS.map +96 -0
- data/test/Data/NLPIR.ctx +0 -0
- data/test/Data/NLPIR.user +0 -0
- data/test/Data/NLPIR_First.map +96 -0
- data/test/Data/NewWord.lst +73 -0
- data/test/Data/PKU.map +96 -0
- data/test/Data/PKU_First.map +96 -0
- data/test/Data/UTF2GBK.map +0 -0
- data/test/Data/UTF2GBKA.map +0 -0
- data/test/Data/UTF8.pdat +0 -0
- data/test/Data/UTF8.wordlist +0 -0
- data/test/Data/UserDict.pdat +0 -0
- data/test/Data/charset.type +0 -0
- data/test/Data/nr.ctx +0 -0
- data/test/Data/nr.fsa +0 -0
- data/test/Data/nr.role +0 -0
- data/test/test.txt +52 -0
- data/test/test_nlpir.rb +158 -0
- data/test/test_result.txt +87 -0
- data/test/userdict.txt +5 -0
- metadata +206 -0
data/nlpir.gemspec
ADDED
@@ -0,0 +1,25 @@
|
|
1
|
+
# coding: utf-8
#
# Gem specification for nlpir, a RubyGems wrapper around the ICTCLAS2013
# Chinese segmentation tools.

# Put this checkout's lib/ directory on the load path so the version file can
# be required straight from the source tree.
lib = File.expand_path('../lib', __FILE__)
$LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
require 'nlpir/version'

Gem::Specification.new do |spec|
  spec.name          = "nlpir"
  spec.version       = Nlpir::VERSION
  spec.authors       = ["JoeWoo"]
  spec.email         = ["0wujian0@gmail.com"]
  # %q{...} is already a string literal. Wrapping the text in an extra pair of
  # double quotes would make those quotes part of the published metadata.
  spec.description   = %q{A rubygem wrapper of chinese segment tools ICTCLAS2013}
  spec.summary       = %q{ICTCLAS是由中国科学院计算技术研究所研发。中文分词;词性标注;命名实体识别;新词识别;同时支持用户词典。}
  spec.homepage      = "https://github.com/JoeWoo/nlpir_win"
  spec.license       = "MIT"

  # The packaged file list comes from git, so the gem has to be built from a
  # git checkout.
  spec.files         = `git ls-files`.split($/)
  # RubyGems generates a Ruby wrapper script for every entry in `executables`.
  # Native libraries kept under bin/ (such as NLPIR.dll) are therefore left
  # out of this list; they are still shipped through `spec.files`.
  spec.executables   = spec.files.grep(%r{^bin/})
                           .reject { |f| File.extname(f).casecmp('.dll').zero? }
                           .map { |f| File.basename(f) }
  spec.test_files    = spec.files.grep(%r{^(test|spec|features)/})
  spec.require_paths = ["lib"]
  spec.required_ruby_version = '>= 2.0.0'
  # Tags the gem with the platform of the machine that runs `gem build`.
  # NOTE(review): the package bundles a Windows DLL, so it presumably has to be
  # built on the Windows platform it targets - confirm before building elsewhere.
  spec.platform = Gem::Platform.local

  spec.add_development_dependency "bundler", "~> 1.3"
  spec.add_development_dependency "rake"
end
|
Binary file
|
data/test/Data/BIG5.pdat
ADDED
Binary file
|
Binary file
|
Binary file
|
@@ -0,0 +1,15 @@
|
|
1
|
+
<?xml version="1.0" encoding="GB2312"?>
|
2
|
+
<NLPIR>
|
3
|
+
<TagSet>ICTPOS.map</TagSet>//词性标注集映射文件
|
4
|
+
<UserDict>on</UserDict>//On：User Dictionary applied; Off: not applied；
|
5
|
+
<UserDictPrior>On</UserDictPrior>//用户词典优先, Added in 2006-03-16, required by NEC On：用户词典和核心词典中同时有的词汇，用户词典优先；尽可能不要启用，否则将核心词典中的词都设置为用户词典，则效果适得其反
|
6
|
+
<FieldDict>off</FieldDict>//On：Field Dictionary applied; Off: not applied；
|
7
|
+
<GranularityContorl>off</GranularityContorl>
|
8
|
+
<Log>On</Log>//On,Off；例如：Off:关闭日志功能；On:打开日志功能
|
9
|
+
<version>2013</version>//系统版本号
|
10
|
+
<Modify>2012-11-14</Modify>//ϵͳ�����ʱ��
|
11
|
+
<Lexicon>2012-11-14</Lexicon>//�ʵ������ʱ��
|
12
|
+
<adaptive>true</adaptive>//����Ӧ�ִʣ�Ĭ��Ϊfalse������Ӧ�ִʵ�Ч�ʻ�ϵ�
|
13
|
+
<author>张华平博士</author>//作者
|
14
|
+
<Contact>pipy_zhang@msn.com</Contact>//作者联系方式
|
15
|
+
</NLPIR>
|
Binary file
|
Binary file
|
Binary file
|
Binary file
|
Binary file
|
data/test/Data/GBK.pdat
ADDED
Binary file
|
Binary file
|
Binary file
|
Binary file
|
Binary file
|
data/test/Data/GBKA.pdat
ADDED
Binary file
|
Binary file
|
Binary file
|
data/test/Data/GBKC.pdat
ADDED
Binary file
|
Binary file
|
Binary file
|