nlpir 0.0.4-x86-mingw32
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/.gitignore +17 -0
- data/LICENSE.txt +22 -0
- data/README.md +195 -0
- data/Rakefile +11 -0
- data/bin/NLPIR.dll +0 -0
- data/lib/Data/BIG2GBK.map +0 -0
- data/lib/Data/BIG5.pdat +0 -0
- data/lib/Data/BIG5.wordlist +0 -0
- data/lib/Data/BiWord.big +0 -0
- data/lib/Data/Configure.xml +15 -0
- data/lib/Data/CoreDict.pdat +0 -0
- data/lib/Data/CoreDict.pos +0 -0
- data/lib/Data/CoreDict.unig +0 -0
- data/lib/Data/FieldDict.pdat +0 -0
- data/lib/Data/FieldDict.pos +0 -0
- data/lib/Data/GBK.pdat +0 -0
- data/lib/Data/GBK.wordlist +0 -0
- data/lib/Data/GBK2BIG.map +0 -0
- data/lib/Data/GBK2GBKC.map +0 -0
- data/lib/Data/GBK2UTF.map +0 -0
- data/lib/Data/GBKA.pdat +0 -0
- data/lib/Data/GBKA.wordlist +0 -0
- data/lib/Data/GBKA2UTF.map +0 -0
- data/lib/Data/GBKC.pdat +0 -0
- data/lib/Data/GBKC.wordlist +0 -0
- data/lib/Data/GBKC2GBK.map +0 -0
- data/lib/Data/GranDict.pdat +3369 -8
- data/lib/Data/GranDict.pos +0 -0
- data/lib/Data/ICTPOS.map +96 -0
- data/lib/Data/NLPIR.ctx +0 -0
- data/lib/Data/NLPIR.user +0 -0
- data/lib/Data/NLPIR_First.map +96 -0
- data/lib/Data/NewWord.lst +25 -0
- data/lib/Data/PKU.map +96 -0
- data/lib/Data/PKU_First.map +96 -0
- data/lib/Data/UTF2GBK.map +0 -0
- data/lib/Data/UTF2GBKA.map +0 -0
- data/lib/Data/UTF8.pdat +0 -0
- data/lib/Data/UTF8.wordlist +0 -0
- data/lib/Data/UserDict.pdat +0 -0
- data/lib/Data/charset.type +0 -0
- data/lib/Data/nr.ctx +0 -0
- data/lib/Data/nr.fsa +0 -0
- data/lib/Data/nr.role +0 -0
- data/lib/nlpir/version.rb +3 -0
- data/lib/nlpir.rb +275 -0
- data/nlpir.gemspec +25 -0
- data/test/Data/BIG2GBK.map +0 -0
- data/test/Data/BIG5.pdat +0 -0
- data/test/Data/BIG5.wordlist +0 -0
- data/test/Data/BiWord.big +0 -0
- data/test/Data/Configure.xml +15 -0
- data/test/Data/CoreDict.pdat +0 -0
- data/test/Data/CoreDict.pos +0 -0
- data/test/Data/CoreDict.unig +0 -0
- data/test/Data/FieldDict.pdat +0 -0
- data/test/Data/FieldDict.pos +0 -0
- data/test/Data/GBK.pdat +0 -0
- data/test/Data/GBK.wordlist +0 -0
- data/test/Data/GBK2BIG.map +0 -0
- data/test/Data/GBK2GBKC.map +0 -0
- data/test/Data/GBK2UTF.map +0 -0
- data/test/Data/GBKA.pdat +0 -0
- data/test/Data/GBKA.wordlist +0 -0
- data/test/Data/GBKA2UTF.map +0 -0
- data/test/Data/GBKC.pdat +0 -0
- data/test/Data/GBKC.wordlist +0 -0
- data/test/Data/GBKC2GBK.map +0 -0
- data/test/Data/GranDict.pdat +3369 -8
- data/test/Data/GranDict.pos +0 -0
- data/test/Data/ICTPOS.map +96 -0
- data/test/Data/NLPIR.ctx +0 -0
- data/test/Data/NLPIR.user +0 -0
- data/test/Data/NLPIR_First.map +96 -0
- data/test/Data/NewWord.lst +73 -0
- data/test/Data/PKU.map +96 -0
- data/test/Data/PKU_First.map +96 -0
- data/test/Data/UTF2GBK.map +0 -0
- data/test/Data/UTF2GBKA.map +0 -0
- data/test/Data/UTF8.pdat +0 -0
- data/test/Data/UTF8.wordlist +0 -0
- data/test/Data/UserDict.pdat +0 -0
- data/test/Data/charset.type +0 -0
- data/test/Data/nr.ctx +0 -0
- data/test/Data/nr.fsa +0 -0
- data/test/Data/nr.role +0 -0
- data/test/test.txt +52 -0
- data/test/test_nlpir.rb +158 -0
- data/test/test_result.txt +87 -0
- data/test/userdict.txt +5 -0
- metadata +206 -0
data/nlpir.gemspec
ADDED
@@ -0,0 +1,25 @@
|
|
1
|
+
# coding: utf-8
|
2
|
+
lib = File.expand_path('../lib', __FILE__)
|
3
|
+
$LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
|
4
|
+
require 'nlpir/version'
|
5
|
+
|
6
|
+
Gem::Specification.new do |spec|
|
7
|
+
spec.name = "nlpir"
|
8
|
+
spec.version = Nlpir::VERSION
|
9
|
+
spec.authors = ["JoeWoo"]
|
10
|
+
spec.email = ["0wujian0@gmail.com"]
|
11
|
+
spec.description = %q{"A rubygem wrapper of chinese segment tools ICTCLAS2013"}
|
12
|
+
spec.summary = %q{"ICTCLAS是由中国科学院计算技术研究所研发。中文分词;词性标注;命名实体识别;新词识别;同时支持用户词典。"}
|
13
|
+
spec.homepage = "https://github.com/JoeWoo/nlpir_win"
|
14
|
+
spec.license = "MIT"
|
15
|
+
|
16
|
+
spec.files = `git ls-files`.split($/)
|
17
|
+
spec.executables = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
|
18
|
+
spec.test_files = spec.files.grep(%r{^(test|spec|features)/})
|
19
|
+
spec.require_paths = ["lib"]
|
20
|
+
spec.required_ruby_version = '>= 2.0.0'
|
21
|
+
spec.platform = Gem::Platform::local
|
22
|
+
|
23
|
+
spec.add_development_dependency "bundler", "~> 1.3"
|
24
|
+
spec.add_development_dependency "rake"
|
25
|
+
end
|
Binary file
|
data/test/Data/BIG5.pdat
ADDED
Binary file
|
Binary file
|
Binary file
|
@@ -0,0 +1,15 @@
|
|
1
|
+
<?xml version="1.0" encoding="GB2312"?>
|
2
|
+
<NLPIR>
|
3
|
+
<TagSet>ICTPOS.map</TagSet>//词性标注集映射文件
|
4
|
+
<UserDict>on</UserDict>//On：User Dictionary applied; Off: not applied；
|
5
|
+
<UserDictPrior>On</UserDictPrior>//�û��ʵ�����,Addedin2006-03-16,requiredbyNECOn���û��ʵ�ͺ��Ĵʵ���ͬʱ�еĴʻ㣬�û��ʵ����ȣ������ܲ�Ҫ���ã���������Ĵʵ��еĴʶ�����Ϊ�û��ʵ䣬��Ч���ʵ��䷴
|
6
|
+
<FieldDict>off</FieldDict>//On：Field Dictionary applied; Off: not applied；
|
7
|
+
<GranularityContorl>off</GranularityContorl>
|
8
|
+
<Log>On</Log>//On,Off；例如：Off:关闭日志功能；On:打开日志功能
|
9
|
+
<version>2013</version>//系统版本号
|
10
|
+
<Modify>2012-11-14</Modify>//ϵͳ�����ʱ��
|
11
|
+
<Lexicon>2012-11-14</Lexicon>//�ʵ������ʱ��
|
12
|
+
<adaptive>true</adaptive>//自适应分词，默认为false；自适应分词的效率会较低
|
13
|
+
<author>张华平博士</author>//作者
|
14
|
+
<Contact>pipy_zhang@msn.com</Contact>//作者联系方式
|
15
|
+
</NLPIR>
|
Binary file
|
Binary file
|
Binary file
|
Binary file
|
Binary file
|
data/test/Data/GBK.pdat
ADDED
Binary file
|
Binary file
|
Binary file
|
Binary file
|
Binary file
|
data/test/Data/GBKA.pdat
ADDED
Binary file
|
Binary file
|
Binary file
|
data/test/Data/GBKC.pdat
ADDED
Binary file
|
Binary file
|
Binary file
|