amalgalite 1.4.1-x86-mingw32 → 1.7.0-x86-mingw32

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (47) hide show
  1. checksums.yaml +5 -5
  2. data/CONTRIBUTING.md +11 -0
  3. data/HISTORY.md +45 -0
  4. data/LICENSE +2 -0
  5. data/Manifest.txt +2 -1
  6. data/README.md +10 -14
  7. data/Rakefile +5 -5
  8. data/examples/fts5.rb +152 -0
  9. data/ext/amalgalite/c/amalgalite.c +26 -0
  10. data/ext/amalgalite/c/amalgalite_constants.c +1110 -56
  11. data/ext/amalgalite/c/amalgalite_database.c +80 -70
  12. data/ext/amalgalite/c/extconf.rb +31 -4
  13. data/ext/amalgalite/c/gen_constants.rb +313 -153
  14. data/ext/amalgalite/c/sqlite3.c +103967 -33836
  15. data/ext/amalgalite/c/sqlite3.h +5438 -1061
  16. data/ext/amalgalite/c/sqlite3ext.h +148 -12
  17. data/lib/amalgalite/2.2/amalgalite.so +0 -0
  18. data/lib/amalgalite/2.3/amalgalite.so +0 -0
  19. data/lib/amalgalite/2.4/amalgalite.so +0 -0
  20. data/lib/amalgalite/2.5/amalgalite.so +0 -0
  21. data/lib/amalgalite/2.6/amalgalite.so +0 -0
  22. data/lib/amalgalite/aggregate.rb +6 -0
  23. data/lib/amalgalite/csv_table_importer.rb +1 -1
  24. data/lib/amalgalite/database.rb +2 -53
  25. data/lib/amalgalite/profile_tap.rb +2 -2
  26. data/lib/amalgalite/statement.rb +5 -2
  27. data/lib/amalgalite/taps/io.rb +5 -2
  28. data/lib/amalgalite/trace_tap.rb +1 -1
  29. data/lib/amalgalite/type_maps/default_map.rb +2 -2
  30. data/lib/amalgalite/type_maps/storage_map.rb +1 -1
  31. data/lib/amalgalite/version.rb +1 -1
  32. data/spec/aggregate_spec.rb +4 -0
  33. data/spec/database_spec.rb +12 -15
  34. data/spec/default_map_spec.rb +1 -1
  35. data/spec/integeration_spec.rb +2 -2
  36. data/spec/json_spec.rb +24 -0
  37. data/spec/sqlite3/version_spec.rb +15 -9
  38. data/spec/storage_map_spec.rb +1 -1
  39. data/tasks/default.rake +3 -10
  40. data/tasks/extension.rake +4 -4
  41. data/tasks/this.rb +7 -5
  42. metadata +33 -25
  43. data/examples/fts3.rb +0 -144
  44. data/lib/amalgalite/1.8/amalgalite.so +0 -0
  45. data/lib/amalgalite/1.9/amalgalite.so +0 -0
  46. data/lib/amalgalite/2.0/amalgalite.so +0 -0
  47. data/lib/amalgalite/2.1/amalgalite.so +0 -0
@@ -1,144 +0,0 @@
1
- #!/usr/bin/env ruby
2
- require 'rubygems'
3
- require 'amalgalite'
4
- require 'benchmark'
5
-
6
- begin
7
- require 'json'
8
- rescue LoadError
9
- abort "'gem install json' to run this example"
10
- end
11
-
12
-
13
- README = <<_
14
- This example programs assumes that you have downloaded the 'Tweets During the
15
- State of the Union address' dataset from infochimps.com
16
-
17
- http://www.infochimps.com/datasets/tweets-during-state-of-the-union-address
18
-
19
- Please:
20
- 1) download this dataset
21
- 2) bunzip + untar this file
22
- 3) record the location of the 'twitter_stream.txt' file that is in the
23
- tarball.
24
- 4) Pass this file as the first parameter to this script.
25
- _
26
-
27
- twitter_stream = ARGV.shift
28
- abort README unless twitter_stream and File.readable?( twitter_stream )
29
-
30
- #
31
- # Lets create a database that utilizes FTS3 http://www.sqlite.org/fts3.html
32
- #
33
- #
34
-
35
- #
36
- # Create a database, this will create the DB if it doesn't exist
37
- #
38
- puts "Opening database (version #{Amalgalite::Version})"
39
- db = Amalgalite::Database.new("fts3.db")
40
-
41
- #
42
- # Create the schema unless it already exists in the table. The meta information
43
- # about the database schema is available as the result of the db.schema method
44
- #
45
- schema = db.schema
46
- unless schema.tables['search']
47
- puts "Create schema"
48
- db.execute_batch <<-SQL
49
- CREATE VIRTUAL TABLE search USING fts3(
50
- filename VARCHAR(128),
51
- content TEXT
52
- );
53
-
54
- CREATE TABLE plain (
55
- filename VARCHAR(128),
56
- content TEXT
57
- );
58
- SQL
59
- db.reload_schema!
60
- end
61
-
62
- #
63
- # Only load the data if the db is empty
64
- #
65
- if db.first_value_from( "SELECT count(*) from search" ) == 0 then
66
- before = Time.now
67
- #
68
- # Load the tweets from the file passed on the commandline into the database
69
- # We just want the text and the tweet id and insert that into the database.
70
- #
71
-
72
- lines = IO.readlines( twitter_stream )
73
- idx = 0
74
-
75
- # Inserting bulk rows as a transaction is good practice with SQLite, it is
76
- # MUCH faster.
77
- db.transaction do |db_in_transaction|
78
- lines.each do |line|
79
-
80
- # quick little parse of the tweet
81
- json = JSON.parse( line )
82
- insert_data = {}
83
- insert_data[':fname'] = json['id']
84
- insert_data[':content'] = json['text']
85
-
86
- # insert into the FTS3 table
87
- db_in_transaction.prepare("INSERT INTO search( filename, content ) VALUES( :fname, :content );") do |stmt|
88
- stmt.execute( insert_data )
89
- end
90
-
91
- # insert into the normal table for comparison
92
- db_in_transaction.prepare("INSERT INTO plain( filename, content ) VALUES( :fname, :content );") do |stmt|
93
- stmt.execute( insert_data )
94
- end
95
-
96
- idx += 1
97
- print "Processed #{idx} of #{lines.size}\r"
98
- $stdout.flush
99
- end
100
- puts "Finalizing..."
101
- end
102
- puts "Took #{Time.now - before} seconds to insert #{idx} lines of #{lines.size}"
103
- puts "Done Inserting"
104
- end
105
-
106
- doc_count = db.first_value_from( "SELECT count(*) from search" )
107
-
108
- #
109
- # Now lets do some searching for some various words
110
- #
111
-
112
- %w[ president salmon thanks ].each do |word|
113
-
114
- count = 100
115
- puts
116
- puts "Searching for '#{word}' across #{doc_count} tweets"
117
- puts "=" * 60
118
-
119
- Benchmark.bm( 15 ) do |x|
120
-
121
- #
122
- # search using the fts search to get the cont of tweets with the given word
123
- #
124
- x.report('fts3: ') do
125
- db.prepare( "SELECT count(filename) FROM search WHERE content MATCH '#{word}'" ) do |stmt|
126
- count.times do
127
- stmt.execute
128
- end
129
- end
130
- end
131
-
132
- #
133
- # search using basic string matching in sqlite.
134
- #
135
- x.report('plain: ') do
136
- db.prepare( "SELECT count(filename) FROM plain WHERE content LIKE '% #{word} %'" ) do |stmt|
137
- count.times do
138
- stmt.execute
139
- end
140
- end
141
- end
142
- end
143
- end
144
-