te_rex 0.1.1 → 0.1.2

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: bae6e503a7f674b25ede59c7f9ef1c5de54b6a78
4
- data.tar.gz: 71e7da095d199a9bc51419a3432912fb461b23c4
3
+ metadata.gz: 8fb50481c19a00e2bebb447eafb28f9ea5371978
4
+ data.tar.gz: b9aa26933ab953af6a5949dd333c52ad9e04dda4
5
5
  SHA512:
6
- metadata.gz: 84220db22732d965161f8e677662b4cb9392f02762d4cf89ef027cdf9622fdc10f8eb26fea72e91301151f6fe24cc71a09029b4d31c77a753b5f8005bfff1868
7
- data.tar.gz: 3fb8d3e66ff969b967075d13a898b8a12e81c5456996e890cb77fe6b21ed076be59d4749ca3d3715d429a298cc48969b516ccfc42548fd51f700bd638dc9aada
6
+ metadata.gz: f3c6a665de08e840db3bb23cfb9465bc3a84f9371ff325fdc01373936029fcc8b73441d2237b8fce4140d5aacfbb4b2796528804a6acd736370377a144044f56
7
+ data.tar.gz: 72b95f6e90af40b1ab3797e1b82afe9fe76432bedaa81adcea10a3eba48aa4b64ecb36e2ed4e083730bf51fa4019f671d518e6ea29f581db95d2f5cdeb980193
@@ -1,126 +1,124 @@
1
1
  module TeRex
2
2
  class StopWord
3
- LIST = [
4
- @enterprise && @dates_times && @connector
5
- ].uniq
6
3
 
7
- @enterprise = [
8
- "-", #bayes_data should handle this but coming through: look at stemmer.
9
- "amadeus",
10
- "ean",
11
- "error",
12
- "expedia",
13
- "java",
14
- "json",
15
- "orbitz",
16
- "priceline",
17
- "sabre",
18
- "travelocity",
19
- "xml",
20
- "xmlst",
21
- "xmlws"
22
- ]
23
- @dates_times = [
24
- "january",
25
- "february",
26
- "march",
27
- "april",
28
- "may",
29
- "june",
30
- "july",
31
- "august",
32
- "september",
33
- "october",
34
- "november",
35
- "december",
36
- "jan",
37
- "feb",
38
- "mar",
39
- "apr",
40
- "aug",
41
- "sept",
42
- "nov",
43
- "dec",
44
- "monday",
45
- "mon",
46
- "tuesday",
47
- "tue",
48
- "wednesday",
49
- "wed",
50
- "thursday",
51
- "thur",
52
- "friday",
53
- "fri",
54
- "saturday",
55
- "sat",
56
- "sunday",
57
- "sun",
58
- "pm",
59
- "am",
60
- "0",
61
- "1",
62
- "2",
63
- "3",
64
- "4",
65
- "5",
66
- "6",
67
- "7",
68
- "8",
69
- "9"
70
- ]
71
- @connector = [
72
- "a",
73
- "all",
74
- "am",
75
- "an",
76
- "and",
77
- "are",
78
- "as",
79
- "at",
80
- "be",
81
- "been",
82
- "by",
83
- "can",
84
- "do",
85
- "does",
86
- "doesn't",
87
- "for",
88
- "get",
89
- "has",
90
- "hotel",
91
- "in",
92
- "into",
93
- "is",
94
- "it",
95
- "it's",
96
- "its",
97
- "of",
98
- "on",
99
- "or",
100
- "so",
101
- "sorry",
102
- "than",
103
- "that",
104
- "that's",
105
- "this",
106
- "the",
107
- "there",
108
- "their",
109
- "to",
110
- "us",
111
- "was",
112
- "we",
113
- "we're",
114
- "were",
115
- "what",
116
- "what's",
117
- "where",
118
- "when",
119
- "which",
120
- "with",
121
- "you",
122
- "you've"
123
- ]
4
+ ENTERPRISE = [
5
+ "-", #bayes_data should handle this but coming through: look at stemmer.
6
+ "amadeus",
7
+ "ean",
8
+ "error",
9
+ "expedia",
10
+ "java",
11
+ "json",
12
+ "orbitz",
13
+ "priceline",
14
+ "sabre",
15
+ "travelocity",
16
+ "xml",
17
+ "xmlst",
18
+ "xmlws"
19
+ ]
20
+ DATES_TIMES = [
21
+ "january",
22
+ "february",
23
+ "march",
24
+ "april",
25
+ "may",
26
+ "june",
27
+ "july",
28
+ "august",
29
+ "september",
30
+ "october",
31
+ "november",
32
+ "december",
33
+ "jan",
34
+ "feb",
35
+ "mar",
36
+ "apr",
37
+ "aug",
38
+ "sept",
39
+ "nov",
40
+ "dec",
41
+ "monday",
42
+ "mon",
43
+ "tuesday",
44
+ "tue",
45
+ "wednesday",
46
+ "wed",
47
+ "thursday",
48
+ "thur",
49
+ "friday",
50
+ "fri",
51
+ "saturday",
52
+ "sat",
53
+ "sunday",
54
+ "sun",
55
+ "pm",
56
+ "am",
57
+ "0",
58
+ "1",
59
+ "2",
60
+ "3",
61
+ "4",
62
+ "5",
63
+ "6",
64
+ "7",
65
+ "8",
66
+ "9"
67
+ ]
68
+ CONNECTOR = [
69
+ "a",
70
+ "all",
71
+ "am",
72
+ "an",
73
+ "and",
74
+ "are",
75
+ "as",
76
+ "at",
77
+ "be",
78
+ "been",
79
+ "by",
80
+ "can",
81
+ "do",
82
+ "does",
83
+ "doesn't",
84
+ "for",
85
+ "get",
86
+ "has",
87
+ "hotel",
88
+ "in",
89
+ "into",
90
+ "is",
91
+ "it",
92
+ "it's",
93
+ "its",
94
+ "of",
95
+ "on",
96
+ "or",
97
+ "so",
98
+ "sorry",
99
+ "than",
100
+ "that",
101
+ "that's",
102
+ "this",
103
+ "the",
104
+ "there",
105
+ "their",
106
+ "to",
107
+ "us",
108
+ "was",
109
+ "we",
110
+ "we're",
111
+ "were",
112
+ "what",
113
+ "what's",
114
+ "where",
115
+ "when",
116
+ "which",
117
+ "with",
118
+ "you",
119
+ "you've"
120
+ ]
124
121
 
122
+ LIST = ENTERPRISE + DATES_TIMES + CONNECTOR
125
123
  end
126
124
  end
@@ -1,3 +1,3 @@
1
1
  module TeRex
2
- VERSION = "0.1.1"
2
+ VERSION = "0.1.2"
3
3
  end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: te_rex
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.1.1
4
+ version: 0.1.2
5
5
  platform: ruby
6
6
  authors:
7
7
  - Joshua Bowles