bigindex-solr 1.2.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (100) hide show
  1. data/.document +5 -0
  2. data/.gitignore +8 -0
  3. data/MIT-LICENSE +20 -0
  4. data/README.rdoc +73 -0
  5. data/Rakefile +49 -0
  6. data/VERSION +1 -0
  7. data/bigindex-solr.gemspec +141 -0
  8. data/examples/bigindex.yml +9 -0
  9. data/install.rb +17 -0
  10. data/lib/bigindex-solr.rb +32 -0
  11. data/lib/bigindex-solr/tasks.rb +3 -0
  12. data/lib/tasks/bigindex_solr.rake +55 -0
  13. data/schema.xml +126 -0
  14. data/solr/CHANGES.txt +562 -0
  15. data/solr/LICENSE.txt +608 -0
  16. data/solr/NOTICE.txt +57 -0
  17. data/solr/etc/jetty.xml +206 -0
  18. data/solr/etc/webdefault.xml +379 -0
  19. data/solr/lib/commons-codec-1.3.jar +0 -0
  20. data/solr/lib/commons-csv-0.1-SNAPSHOT.jar +0 -0
  21. data/solr/lib/commons-fileupload-1.2.jar +0 -0
  22. data/solr/lib/commons-io-1.2.jar +0 -0
  23. data/solr/lib/easymock.jar +0 -0
  24. data/solr/lib/jetty-6.1.3.jar +0 -0
  25. data/solr/lib/jetty-util-6.1.3.jar +0 -0
  26. data/solr/lib/jsp-2.1/ant-1.6.5.jar +0 -0
  27. data/solr/lib/jsp-2.1/core-3.1.1.jar +0 -0
  28. data/solr/lib/jsp-2.1/jsp-2.1.jar +0 -0
  29. data/solr/lib/jsp-2.1/jsp-api-2.1.jar +0 -0
  30. data/solr/lib/lucene-analyzers-2007-05-20_00-04-53.jar +0 -0
  31. data/solr/lib/lucene-core-2007-05-20_00-04-53.jar +0 -0
  32. data/solr/lib/lucene-highlighter-2007-05-20_00-04-53.jar +0 -0
  33. data/solr/lib/lucene-snowball-2007-05-20_00-04-53.jar +0 -0
  34. data/solr/lib/lucene-spellchecker-2007-05-20_00-04-53.jar +0 -0
  35. data/solr/lib/servlet-api-2.4.jar +0 -0
  36. data/solr/lib/servlet-api-2.5-6.1.3.jar +0 -0
  37. data/solr/lib/xpp3-1.1.3.4.O.jar +0 -0
  38. data/solr/solr/README.txt +52 -0
  39. data/solr/solr/bin/abc +176 -0
  40. data/solr/solr/bin/abo +176 -0
  41. data/solr/solr/bin/backup +108 -0
  42. data/solr/solr/bin/backupcleaner +142 -0
  43. data/solr/solr/bin/commit +128 -0
  44. data/solr/solr/bin/optimize +129 -0
  45. data/solr/solr/bin/readercycle +129 -0
  46. data/solr/solr/bin/rsyncd-disable +77 -0
  47. data/solr/solr/bin/rsyncd-enable +76 -0
  48. data/solr/solr/bin/rsyncd-start +145 -0
  49. data/solr/solr/bin/rsyncd-stop +105 -0
  50. data/solr/solr/bin/scripts-util +83 -0
  51. data/solr/solr/bin/snapcleaner +148 -0
  52. data/solr/solr/bin/snapinstaller +168 -0
  53. data/solr/solr/bin/snappuller +248 -0
  54. data/solr/solr/bin/snappuller-disable +77 -0
  55. data/solr/solr/bin/snappuller-enable +77 -0
  56. data/solr/solr/bin/snapshooter +109 -0
  57. data/solr/solr/conf/admin-extra.html +31 -0
  58. data/solr/solr/conf/protwords.txt +21 -0
  59. data/solr/solr/conf/schema.xml +126 -0
  60. data/solr/solr/conf/scripts.conf +24 -0
  61. data/solr/solr/conf/solrconfig.xml +458 -0
  62. data/solr/solr/conf/stopwords.txt +57 -0
  63. data/solr/solr/conf/synonyms.txt +31 -0
  64. data/solr/solr/conf/xslt/example.xsl +132 -0
  65. data/solr/solr/conf/xslt/example_atom.xsl +63 -0
  66. data/solr/solr/conf/xslt/example_rss.xsl +62 -0
  67. data/solr/solr/data/development/index/_a.fdt +0 -0
  68. data/solr/solr/data/development/index/_a.fdx +0 -0
  69. data/solr/solr/data/development/index/_a.fnm +2 -0
  70. data/solr/solr/data/development/index/_a.frq +1 -0
  71. data/solr/solr/data/development/index/_a.nrm +1 -0
  72. data/solr/solr/data/development/index/_a.prx +0 -0
  73. data/solr/solr/data/development/index/_a.tii +0 -0
  74. data/solr/solr/data/development/index/_a.tis +0 -0
  75. data/solr/solr/data/development/index/_a_1.del +0 -0
  76. data/solr/solr/data/development/index/_b.fdt +0 -0
  77. data/solr/solr/data/development/index/_b.fdx +0 -0
  78. data/solr/solr/data/development/index/_b.fnm +2 -0
  79. data/solr/solr/data/development/index/_b.frq +0 -0
  80. data/solr/solr/data/development/index/_b.nrm +1 -0
  81. data/solr/solr/data/development/index/_b.prx +0 -0
  82. data/solr/solr/data/development/index/_b.tii +0 -0
  83. data/solr/solr/data/development/index/_b.tis +0 -0
  84. data/solr/solr/data/development/index/_b_1.del +0 -0
  85. data/solr/solr/data/development/index/_c.fdt +0 -0
  86. data/solr/solr/data/development/index/_c.fdx +0 -0
  87. data/solr/solr/data/development/index/_c.fnm +2 -0
  88. data/solr/solr/data/development/index/_c.frq +1 -0
  89. data/solr/solr/data/development/index/_c.nrm +1 -0
  90. data/solr/solr/data/development/index/_c.prx +0 -0
  91. data/solr/solr/data/development/index/_c.tii +0 -0
  92. data/solr/solr/data/development/index/_c.tis +0 -0
  93. data/solr/solr/data/development/index/_c_1.del +0 -0
  94. data/solr/solr/data/development/index/segments.gen +0 -0
  95. data/solr/solr/data/development/index/segments_q +0 -0
  96. data/solr/start.jar +0 -0
  97. data/solr/webapps/solr.war +0 -0
  98. data/spec/bigindex-solr_spec.rb +7 -0
  99. data/spec/spec_helper.rb +9 -0
  100. metadata +163 -0
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
@@ -0,0 +1,52 @@
1
+ # Licensed to the Apache Software Foundation (ASF) under one or more
2
+ # contributor license agreements. See the NOTICE file distributed with
3
+ # this work for additional information regarding copyright ownership.
4
+ # The ASF licenses this file to You under the Apache License, Version 2.0
5
+ # (the "License"); you may not use this file except in compliance with
6
+ # the License. You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+
17
+ Example "Solr Home" Directory
18
+ =============================
19
+
20
+ This directory is provided as an example of what a "Solr Home" directory
21
+ should look like.
22
+
23
+ It's not strictly necessary that you copy all of the files in this
24
+ directory when setting up a new instance of Solr, but it is recommended.
25
+
26
+
27
+ Basic Directory Structure
28
+ -------------------------
29
+
30
+ The Solr Home directory typically contains the following subdirectories...
31
+
32
+ conf/
33
+ This directory is mandatory and must contain your solrconfig.xml
34
+ and schema.xml. Any other optional configuration files would also
35
+ be kept here.
36
+
37
+ data/
38
+ This directory is the default location where Solr will keep your
39
+ index, and is used by the replication scripts for dealing with
40
+ snapshots. You can override this location in the solrconfig.xml
41
+ and scripts.conf files. Solr will create this directory if it
42
+ does not already exist.
43
+
44
+ lib/
45
+ This directory is optional. If it exists, Solr will load any Jars
46
+ found in this directory and use them to resolve any "plugins"
47
+ specified in your solrconfig.xml or schema.xml (ie: Analyzers,
48
+ Request Handlers, etc...)
49
+
50
+ bin/
51
+ This directory is optional. It is the default location used for
52
+ keeping the replication scripts.
data/solr/solr/bin/abc ADDED
@@ -0,0 +1,176 @@
1
+ #!/bin/bash
2
+ #
3
+ # Licensed to the Apache Software Foundation (ASF) under one or more
4
+ # contributor license agreements. See the NOTICE file distributed with
5
+ # this work for additional information regarding copyright ownership.
6
+ # The ASF licenses this file to You under the Apache License, Version 2.0
7
+ # (the "License"); you may not use this file except in compliance with
8
+ # the License. You may obtain a copy of the License at
9
+ #
10
+ # http://www.apache.org/licenses/LICENSE-2.0
11
+ #
12
+ # Unless required by applicable law or agreed to in writing, software
13
+ # distributed under the License is distributed on an "AS IS" BASIS,
14
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ # See the License for the specific language governing permissions and
16
+ # limitations under the License.
17
+ #
18
+ # Shell script to make an Atomic Backup after Commit of
19
+ # a Solr Lucene collection.
20
+
21
+ orig_dir=$(pwd)
22
+ cd ${0%/*}/..
23
+ solr_root=$(pwd)
24
+ cd ${orig_dir}
25
+ curl_url=""
26
+
27
+ unset solr_hostname solr_port data_dir webapp_name user verbose debug solr_url
28
+ . ${solr_root}/bin/scripts-util
29
+
30
+ # set up variables
31
+ prog=${0##*/}
32
+ log=${solr_root}/logs/${prog}.log
33
+
34
+ # define usage string
35
+ USAGE="\
36
+ usage: $prog [-h hostname] [-p port] [-d dir] [-w webappname] [-u username] [-U url] [-v] [-V]
37
+ -h specify Solr hostname (defaults to localhost)
38
+ -p specify Solr port number
39
+ -w specify name of Solr webapp (defaults to solr)
40
+ -u specify user to sudo to before running script
41
+ -U specify full update url (overrides -h,-p,-w parameters)
42
+ -d specify directory holding index data
43
+ -v increase verbosity
44
+ -V output debugging info
45
+ "
46
+
47
+ # parse args
48
+ while getopts h:p:d:w:u:U:vV OPTION
49
+ do
50
+ case $OPTION in
51
+ h)
52
+ solr_hostname="$OPTARG"
53
+ ;;
54
+ p)
55
+ solr_port="$OPTARG"
56
+ ;;
57
+ d)
58
+ data_dir="$OPTARG"
59
+ ;;
60
+ w)
61
+ webapp_name="$OPTARG"
62
+ ;;
63
+ u)
64
+ user="$OPTARG"
65
+ ;;
66
+ U)
67
+ solr_url="$OPTARG"
68
+ ;;
69
+ v)
70
+ verbose="v"
71
+ ;;
72
+ V)
73
+ debug="V"
74
+ ;;
75
+ *)
76
+ echo "$USAGE"
77
+ exit 1
78
+ esac
79
+ done
80
+
81
+ [[ -n $debug ]] && set -x
82
+
83
+ # use default value for data_dir if not specified
84
+ # relative path starts at ${solr_root}
85
+ if [[ -z ${data_dir} ]]
86
+ then
87
+ data_dir=${solr_root}/data
88
+ elif [[ "`echo ${data_dir}|cut -c1`" != "/" ]]
89
+ then
90
+ data_dir=${solr_root}/${data_dir}
91
+ fi
92
+
93
+ if [[ -n ${solr_url} ]]
94
+ then
95
+ curl_url=${solr_url}
96
+ else
97
+ if [[ -z ${solr_port} ]]
98
+ then
99
+ echo "Solr port number missing in $confFile or command line."
100
+ echo "$USAGE"
101
+ exit 1
102
+ fi
103
+
104
+ # use default hostname if not specified
105
+ if [[ -z ${solr_hostname} ]]
106
+ then
107
+ solr_hostname=localhost
108
+ fi
109
+
110
+ # use default webapp name if not specified
111
+ if [[ -z ${webapp_name} ]]
112
+ then
113
+ webapp_name=solr
114
+ fi
115
+ curl_url=http://${solr_hostname}:${solr_port}/${webapp_name}/update
116
+ fi
117
+
118
+ fixUser "$@"
119
+
120
+ start=`date +"%s"`
121
+
122
+ logMessage started by $oldwhoami
123
+ logMessage command: $0 $@
124
+
125
+ logMessage sending commit to Solr server at ${curl_url}
126
+ rs=`curl ${curl_url} -s -H 'Content-type:text/xml; charset=utf-8' -d "<commit/>"`
127
+ if [[ $? != 0 ]]
128
+ then
129
+ logMessage failed to connect to Solr server at ${curl_url}
130
+ logMessage commit failed
131
+ logExit failed 1
132
+ fi
133
+
134
+ # check status of commit request
135
+ echo $rs | grep '<result.*status="0"' > /dev/null 2>&1
136
+ if [[ $? != 0 ]]
137
+ then
138
+ logMessage commit request to Solr at ${curl_url} failed:
139
+ logMessage $rs
140
+ logExit failed 2
141
+ fi
142
+
143
+ # successful commit creates a snapshot file synchronously
144
+ lastsnap=`ls -drt1 ${data_dir}/snapshot.* 2> /dev/null | tail -1 `
145
+
146
+ if [[ $lastsnap == "" ]]
147
+ then
148
+ logMessage commit did not create snapshot at ${curl_url}, backup failed:
149
+ logExit failed 3
150
+ fi
151
+
152
+ name=backup.${lastsnap##*snapshot.}
153
+ temp=temp-${name}
154
+
155
+ if [[ -d ${data_dir}/${name} ]]
156
+ then
157
+ logMessage backup directory ${data_dir}/${name} already exists
158
+ logExit aborted 1
159
+ fi
160
+
161
+ if [[ -d ${data_dir}/${temp} ]]
162
+ then
163
+ logMessage backingup of ${data_dir}/${name} in progress
164
+ logExit aborted 1
165
+ fi
166
+ logMessage making backup ${data_dir}/${name}
167
+
168
+ # clean up after INT/TERM
169
+ trap 'echo cleaning up, please wait ...;/bin/rm -rf ${data_dir}/${name} ${data_dir}/${temp};logExit aborted 13' INT TERM
170
+
171
+ # make a backup using hard links into temporary location
172
+ # then move it into place atomically
173
+ cp -lr ${lastsnap} ${data_dir}/${temp}
174
+ mv ${data_dir}/${temp} ${data_dir}/${name}
175
+
176
+ logExit ended 0
data/solr/solr/bin/abo ADDED
@@ -0,0 +1,176 @@
1
+ #!/bin/bash
2
+ #
3
+ # Licensed to the Apache Software Foundation (ASF) under one or more
4
+ # contributor license agreements. See the NOTICE file distributed with
5
+ # this work for additional information regarding copyright ownership.
6
+ # The ASF licenses this file to You under the Apache License, Version 2.0
7
+ # (the "License"); you may not use this file except in compliance with
8
+ # the License. You may obtain a copy of the License at
9
+ #
10
+ # http://www.apache.org/licenses/LICENSE-2.0
11
+ #
12
+ # Unless required by applicable law or agreed to in writing, software
13
+ # distributed under the License is distributed on an "AS IS" BASIS,
14
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ # See the License for the specific language governing permissions and
16
+ # limitations under the License.
17
+ #
18
+ # Shell script to make an Atomic Backup after Optimize of
19
+ # a Solr Lucene collection.
20
+
21
+ orig_dir=$(pwd)
22
+ cd ${0%/*}/..
23
+ solr_root=$(pwd)
24
+ cd ${orig_dir}
25
+ curl_url=""
26
+
27
+ unset solr_hostname solr_port data_dir webapp_name user verbose debug solr_url
28
+ . ${solr_root}/bin/scripts-util
29
+
30
+ # set up variables
31
+ prog=${0##*/}
32
+ log=${solr_root}/logs/${prog}.log
33
+
34
+ # define usage string
35
+ USAGE="\
36
+ usage: $prog [-h hostname] [-p port] [-d dir] [-w webapp_name] [-u username] [-U url] [-v] [-V]
37
+ -h specify Solr hostname (defaults to localhost)
38
+ -p specify Solr port number
39
+ -w specify name of Solr webapp (defaults to solr)
40
+ -u specify user to sudo to before running script
41
+ -U specify full update url (overrides -h,-p,-w parameters)
42
+ -d specify directory holding index data (defaults to data)
43
+ -v increase verbosity
44
+ -V output debugging info
45
+ "
46
+
47
+ # parse args
48
+ while getopts h:p:d:w:u:U:vV OPTION
49
+ do
50
+ case $OPTION in
51
+ h)
52
+ solr_hostname="$OPTARG"
53
+ ;;
54
+ p)
55
+ solr_port="$OPTARG"
56
+ ;;
57
+ d)
58
+ data_dir="$OPTARG"
59
+ ;;
60
+ w)
61
+ webapp_name="$OPTARG"
62
+ ;;
63
+ u)
64
+ user="$OPTARG"
65
+ ;;
66
+ U)
67
+ solr_url="$OPTARG"
68
+ ;;
69
+ v)
70
+ verbose="v"
71
+ ;;
72
+ V)
73
+ debug="V"
74
+ ;;
75
+ *)
76
+ echo "$USAGE"
77
+ exit 1
78
+ esac
79
+ done
80
+
81
+ [[ -n $debug ]] && set -x
82
+
83
+ # use default value for data_dir if not specified
84
+ # relative path starts at ${solr_root}
85
+ if [[ -z ${data_dir} ]]
86
+ then
87
+ data_dir=${solr_root}/data
88
+ elif [[ "`echo ${data_dir}|cut -c1`" != "/" ]]
89
+ then
90
+ data_dir=${solr_root}/${data_dir}
91
+ fi
92
+
93
+ if [[ -n ${solr_url} ]]
94
+ then
95
+ curl_url=${solr_url}
96
+ else
97
+ if [[ -z ${solr_port} ]]
98
+ then
99
+ echo "Solr port number missing in $confFile or command line."
100
+ echo "$USAGE"
101
+ exit 1
102
+ fi
103
+
104
+ # use default hostname if not specified
105
+ if [[ -z ${solr_hostname} ]]
106
+ then
107
+ solr_hostname=localhost
108
+ fi
109
+
110
+ # use default webapp name if not specified
111
+ if [[ -z ${webapp_name} ]]
112
+ then
113
+ webapp_name=solr
114
+ fi
115
+ curl_url=http://${solr_hostname}:${solr_port}/${webapp_name}/update
116
+ fi
117
+
118
+ fixUser "$@"
119
+
120
+ start=`date +"%s"`
121
+
122
+ logMessage started by $oldwhoami
123
+ logMessage command: $0 $@
124
+
125
+ logMessage sending optimize to Solr server at ${curl_url}
126
+ rs=`curl ${curl_url} -s -H 'Content-type:text/xml; charset=utf-8' -d "<optimize/>"`
127
+ if [[ $? != 0 ]]
128
+ then
129
+ logMessage failed to connect to Solr server at ${curl_url}
130
+ logMessage optimize failed
131
+ logExit failed 1
132
+ fi
133
+
134
+ # check status of optimize request
135
+ echo $rs | grep '<result.*status="0"' > /dev/null 2>&1
136
+ if [[ $? != 0 ]]
137
+ then
138
+ logMessage optimize request to Solr at ${curl_url} failed:
139
+ logMessage $rs
140
+ logExit failed 2
141
+ fi
142
+
143
+ # successful optimize creates a snapshot file synchronously
144
+ lastsnap=`ls -drt1 ${data_dir}/snapshot.* | tail -1 `
145
+
146
+ if [[ $lastsnap == "" ]]
147
+ then
148
+ logMessage commit did not create snapshot at ${curl_url}, backup failed:
149
+ logExit failed 3
150
+ fi
151
+
152
+ name=backup.${lastsnap##*snapshot.}
153
+ temp=temp-${name}
154
+
155
+ if [[ -d ${data_dir}/${name} ]]
156
+ then
157
+ logMessage backup directory ${data_dir}/${name} already exists
158
+ logExit aborted 1
159
+ fi
160
+
161
+ if [[ -d ${data_dir}/${temp} ]]
162
+ then
163
+ logMessage backingup of ${data_dir}/${name} in progress
164
+ logExit aborted 1
165
+ fi
166
+ logMessage making backup ${data_dir}/${name}
167
+
168
+ # clean up after INT/TERM
169
+ trap 'echo cleaning up, please wait ...;/bin/rm -rf ${data_dir}/${name} ${data_dir}/${temp};logExit aborted 13' INT TERM
170
+
171
+ # make a backup using hard links into temporary location
172
+ # then move it into place atomically
173
+ cp -lr ${lastsnap} ${data_dir}/${temp}
174
+ mv ${data_dir}/${temp} ${data_dir}/${name}
175
+
176
+ logExit ended 0