te_rex 0.1.1 → 0.1.2

This diff compares the contents of two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: bae6e503a7f674b25ede59c7f9ef1c5de54b6a78
4
- data.tar.gz: 71e7da095d199a9bc51419a3432912fb461b23c4
3
+ metadata.gz: 8fb50481c19a00e2bebb447eafb28f9ea5371978
4
+ data.tar.gz: b9aa26933ab953af6a5949dd333c52ad9e04dda4
5
5
  SHA512:
6
- metadata.gz: 84220db22732d965161f8e677662b4cb9392f02762d4cf89ef027cdf9622fdc10f8eb26fea72e91301151f6fe24cc71a09029b4d31c77a753b5f8005bfff1868
7
- data.tar.gz: 3fb8d3e66ff969b967075d13a898b8a12e81c5456996e890cb77fe6b21ed076be59d4749ca3d3715d429a298cc48969b516ccfc42548fd51f700bd638dc9aada
6
+ metadata.gz: f3c6a665de08e840db3bb23cfb9465bc3a84f9371ff325fdc01373936029fcc8b73441d2237b8fce4140d5aacfbb4b2796528804a6acd736370377a144044f56
7
+ data.tar.gz: 72b95f6e90af40b1ab3797e1b82afe9fe76432bedaa81adcea10a3eba48aa4b64ecb36e2ed4e083730bf51fa4019f671d518e6ea29f581db95d2f5cdeb980193
@@ -1,126 +1,124 @@
1
1
  module TeRex
2
2
  class StopWord
3
- LIST = [
4
- @enterprise && @dates_times && @connector
5
- ].uniq
6
3
 
7
- @enterprise = [
8
- "-", #bayes_data should handle this but coming through: look at stemmer.
9
- "amadeus",
10
- "ean",
11
- "error",
12
- "expedia",
13
- "java",
14
- "json",
15
- "orbitz",
16
- "priceline",
17
- "sabre",
18
- "travelocity",
19
- "xml",
20
- "xmlst",
21
- "xmlws"
22
- ]
23
- @dates_times = [
24
- "january",
25
- "february",
26
- "march",
27
- "april",
28
- "may",
29
- "june",
30
- "july",
31
- "august",
32
- "september",
33
- "october",
34
- "november",
35
- "december",
36
- "jan",
37
- "feb",
38
- "mar",
39
- "apr",
40
- "aug",
41
- "sept",
42
- "nov",
43
- "dec",
44
- "monday",
45
- "mon",
46
- "tuesday",
47
- "tue",
48
- "wednesday",
49
- "wed",
50
- "thursday",
51
- "thur",
52
- "friday",
53
- "fri",
54
- "saturday",
55
- "sat",
56
- "sunday",
57
- "sun",
58
- "pm",
59
- "am",
60
- "0",
61
- "1",
62
- "2",
63
- "3",
64
- "4",
65
- "5",
66
- "6",
67
- "7",
68
- "8",
69
- "9"
70
- ]
71
- @connector = [
72
- "a",
73
- "all",
74
- "am",
75
- "an",
76
- "and",
77
- "are",
78
- "as",
79
- "at",
80
- "be",
81
- "been",
82
- "by",
83
- "can",
84
- "do",
85
- "does",
86
- "doesn't",
87
- "for",
88
- "get",
89
- "has",
90
- "hotel",
91
- "in",
92
- "into",
93
- "is",
94
- "it",
95
- "it's",
96
- "its",
97
- "of",
98
- "on",
99
- "or",
100
- "so",
101
- "sorry",
102
- "than",
103
- "that",
104
- "that's",
105
- "this",
106
- "the",
107
- "there",
108
- "their",
109
- "to",
110
- "us",
111
- "was",
112
- "we",
113
- "we're",
114
- "were",
115
- "what",
116
- "what's",
117
- "where",
118
- "when",
119
- "which",
120
- "with",
121
- "you",
122
- "you've"
123
- ]
4
+ ENTERPRISE = [
5
+ "-", #bayes_data should handle this but coming through: look at stemmer.
6
+ "amadeus",
7
+ "ean",
8
+ "error",
9
+ "expedia",
10
+ "java",
11
+ "json",
12
+ "orbitz",
13
+ "priceline",
14
+ "sabre",
15
+ "travelocity",
16
+ "xml",
17
+ "xmlst",
18
+ "xmlws"
19
+ ]
20
+ DATES_TIMES = [
21
+ "january",
22
+ "february",
23
+ "march",
24
+ "april",
25
+ "may",
26
+ "june",
27
+ "july",
28
+ "august",
29
+ "september",
30
+ "october",
31
+ "november",
32
+ "december",
33
+ "jan",
34
+ "feb",
35
+ "mar",
36
+ "apr",
37
+ "aug",
38
+ "sept",
39
+ "nov",
40
+ "dec",
41
+ "monday",
42
+ "mon",
43
+ "tuesday",
44
+ "tue",
45
+ "wednesday",
46
+ "wed",
47
+ "thursday",
48
+ "thur",
49
+ "friday",
50
+ "fri",
51
+ "saturday",
52
+ "sat",
53
+ "sunday",
54
+ "sun",
55
+ "pm",
56
+ "am",
57
+ "0",
58
+ "1",
59
+ "2",
60
+ "3",
61
+ "4",
62
+ "5",
63
+ "6",
64
+ "7",
65
+ "8",
66
+ "9"
67
+ ]
68
+ CONNECTOR = [
69
+ "a",
70
+ "all",
71
+ "am",
72
+ "an",
73
+ "and",
74
+ "are",
75
+ "as",
76
+ "at",
77
+ "be",
78
+ "been",
79
+ "by",
80
+ "can",
81
+ "do",
82
+ "does",
83
+ "doesn't",
84
+ "for",
85
+ "get",
86
+ "has",
87
+ "hotel",
88
+ "in",
89
+ "into",
90
+ "is",
91
+ "it",
92
+ "it's",
93
+ "its",
94
+ "of",
95
+ "on",
96
+ "or",
97
+ "so",
98
+ "sorry",
99
+ "than",
100
+ "that",
101
+ "that's",
102
+ "this",
103
+ "the",
104
+ "there",
105
+ "their",
106
+ "to",
107
+ "us",
108
+ "was",
109
+ "we",
110
+ "we're",
111
+ "were",
112
+ "what",
113
+ "what's",
114
+ "where",
115
+ "when",
116
+ "which",
117
+ "with",
118
+ "you",
119
+ "you've"
120
+ ]
124
121
 
122
+ LIST = ENTERPRISE + DATES_TIMES + CONNECTOR
125
123
  end
126
124
  end
@@ -1,3 +1,3 @@
1
1
  module TeRex
2
- VERSION = "0.1.1"
2
+ VERSION = "0.1.2"
3
3
  end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: te_rex
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.1.1
4
+ version: 0.1.2
5
5
  platform: ruby
6
6
  authors:
7
7
  - Joshua Bowles