perobs 2.5.0 → 3.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/perobs/Array.rb +1 -1
- data/lib/perobs/BTree.rb +233 -0
- data/lib/perobs/BTreeDB.rb +2 -0
- data/lib/perobs/BTreeNode.rb +706 -0
- data/lib/perobs/BTreeNodeCache.rb +107 -0
- data/lib/perobs/BTreeNodeLink.rb +141 -0
- data/lib/perobs/EquiBlobsFile.rb +570 -0
- data/lib/perobs/FlatFile.rb +179 -78
- data/lib/perobs/FlatFileBlobHeader.rb +92 -17
- data/lib/perobs/FlatFileDB.rb +16 -7
- data/lib/perobs/LockFile.rb +181 -0
- data/lib/perobs/Object.rb +2 -1
- data/lib/perobs/SpaceTree.rb +181 -0
- data/lib/perobs/SpaceTreeNode.rb +672 -0
- data/lib/perobs/SpaceTreeNodeCache.rb +76 -0
- data/lib/perobs/SpaceTreeNodeLink.rb +103 -0
- data/lib/perobs/Store.rb +27 -13
- data/lib/perobs/version.rb +1 -1
- data/test/BTree_spec.rb +128 -0
- data/test/EquiBlobsFile_spec.rb +199 -0
- data/test/FlatFileDB_spec.rb +63 -9
- data/test/LockFile_spec.rb +133 -0
- data/test/SpaceTree_spec.rb +245 -0
- data/test/Store_spec.rb +3 -0
- data/test/spec_helper.rb +13 -0
- metadata +21 -13
- data/lib/perobs/FixedSizeBlobFile.rb +0 -193
- data/lib/perobs/FreeSpaceManager.rb +0 -204
- data/lib/perobs/IndexTree.rb +0 -145
- data/lib/perobs/IndexTreeNode.rb +0 -316
- data/test/FixedSizeBlobFile_spec.rb +0 -91
- data/test/FreeSpaceManager_spec.rb +0 -91
- data/test/IndexTree_spec.rb +0 -118
data/lib/perobs/FlatFile.rb
CHANGED
@@ -29,8 +29,8 @@ require 'zlib'
|
|
29
29
|
|
30
30
|
require 'perobs/Log'
|
31
31
|
require 'perobs/FlatFileBlobHeader'
|
32
|
-
require 'perobs/
|
33
|
-
require 'perobs/
|
32
|
+
require 'perobs/BTree'
|
33
|
+
require 'perobs/SpaceTree'
|
34
34
|
|
35
35
|
module PEROBS
|
36
36
|
|
@@ -39,34 +39,59 @@ module PEROBS
|
|
39
39
|
# blob data bytes.
|
40
40
|
class FlatFile
|
41
41
|
|
42
|
+
# The number of entries in a single BTree node of the index file.
|
43
|
+
INDEX_BTREE_ORDER = 65
|
44
|
+
|
42
45
|
# Create a new FlatFile object for a database in the given path.
|
43
46
|
# @param dir [String] Directory path for the data base file
|
44
47
|
def initialize(dir)
|
45
48
|
@db_dir = dir
|
46
49
|
@f = nil
|
47
|
-
@index =
|
48
|
-
@space_list =
|
50
|
+
@index = BTree.new(@db_dir, 'index', INDEX_BTREE_ORDER)
|
51
|
+
@space_list = SpaceTree.new(@db_dir)
|
49
52
|
end
|
50
53
|
|
51
54
|
# Open the flat file for reading and writing.
|
52
55
|
def open
|
53
56
|
file_name = File.join(@db_dir, 'database.blobs')
|
57
|
+
new_db_created = false
|
54
58
|
begin
|
55
59
|
if File.exist?(file_name)
|
56
60
|
@f = File.open(file_name, 'rb+')
|
57
61
|
else
|
58
|
-
PEROBS.log.info
|
62
|
+
PEROBS.log.info "New FlatFile database '#{file_name}' created"
|
59
63
|
@f = File.open(file_name, 'wb+')
|
64
|
+
new_db_created = true
|
60
65
|
end
|
61
66
|
rescue IOError => e
|
62
|
-
PEROBS.log.fatal "Cannot open
|
67
|
+
PEROBS.log.fatal "Cannot open FlatFile database #{file_name}: " +
|
63
68
|
e.message
|
64
69
|
end
|
65
70
|
unless @f.flock(File::LOCK_NB | File::LOCK_EX)
|
66
|
-
PEROBS.log.fatal '
|
71
|
+
PEROBS.log.fatal "FlatFile database '#{file_name}' is locked by " +
|
72
|
+
"another process"
|
73
|
+
end
|
74
|
+
|
75
|
+
begin
|
76
|
+
@index.open(!new_db_created)
|
77
|
+
@space_list.open
|
78
|
+
rescue FatalError
|
79
|
+
# Ensure that the index is really closed.
|
80
|
+
@index.close
|
81
|
+
# Erase it completely
|
82
|
+
@index.erase
|
83
|
+
# Then create it again.
|
84
|
+
@index.open
|
85
|
+
|
86
|
+
# Ensure that the spaces list is really closed.
|
87
|
+
@space_list.close
|
88
|
+
# Erase it completely
|
89
|
+
@space_list.erase
|
90
|
+
# Then create it again
|
91
|
+
@space_list.open
|
92
|
+
|
93
|
+
regenerate_index_and_spaces
|
67
94
|
end
|
68
|
-
@index.open
|
69
|
-
@space_list.open
|
70
95
|
end
|
71
96
|
|
72
97
|
# Close the flat file. This method must be called to ensure that all data
|
@@ -74,10 +99,13 @@ module PEROBS
|
|
74
99
|
def close
|
75
100
|
@space_list.close
|
76
101
|
@index.close
|
77
|
-
|
78
|
-
@f
|
79
|
-
|
80
|
-
|
102
|
+
|
103
|
+
if @f
|
104
|
+
@f.flush
|
105
|
+
@f.flock(File::LOCK_UN)
|
106
|
+
@f.close
|
107
|
+
@f = nil
|
108
|
+
end
|
81
109
|
end
|
82
110
|
|
83
111
|
# Force outstanding data to be written to the filesystem.
|
@@ -87,6 +115,7 @@ module PEROBS
|
|
87
115
|
rescue IOError => e
|
88
116
|
PEROBS.log.fatal "Cannot sync flat file database: #{e.message}"
|
89
117
|
end
|
118
|
+
@index.sync
|
90
119
|
end
|
91
120
|
|
92
121
|
# Delete the blob for the specified ID.
|
@@ -105,16 +134,10 @@ module PEROBS
|
|
105
134
|
# @param addr [Integer] Address of the blob to delete
|
106
135
|
# @param id [Integer] ID of the blob to delete
|
107
136
|
def delete_obj_by_address(addr, id)
|
108
|
-
@index.
|
137
|
+
@index.remove(id)
|
109
138
|
header = FlatFileBlobHeader.read_at(@f, addr, id)
|
110
|
-
|
111
|
-
|
112
|
-
@f.write([ 0 ].pack('C'))
|
113
|
-
@f.flush
|
114
|
-
@space_list.add_space(addr, header.length)
|
115
|
-
rescue IOError => e
|
116
|
-
PEROBS.log.fatal "Cannot erase blob for ID #{header.id}: #{e.message}"
|
117
|
-
end
|
139
|
+
header.clear_flags
|
140
|
+
@space_list.add_space(addr, header.length)
|
118
141
|
end
|
119
142
|
|
120
143
|
# Delete all unmarked objects.
|
@@ -136,12 +159,23 @@ module PEROBS
|
|
136
159
|
deleted_ids
|
137
160
|
end
|
138
161
|
|
139
|
-
# Write the given object into the file. This method
|
140
|
-
#
|
162
|
+
# Write the given object into the file. This method never uses in-place
|
163
|
+
# updates for existing objects. A new copy is inserted first and only when
|
164
|
+
# the insert was successful, the old copy is deleted and the index
|
165
|
+
# updated.
|
141
166
|
# @param id [Integer] ID of the object
|
142
167
|
# @param raw_obj [String] Raw object as String
|
143
168
|
# @return [Integer] position of the written blob in the blob file
|
144
169
|
def write_obj_by_id(id, raw_obj)
|
170
|
+
# Check if we have already an object with the given ID. We'll mark it as
|
171
|
+
# outdated and save the header for later deletion. In case this
|
172
|
+
# operation is aborted or interrupted we ensure that we either have the
|
173
|
+
# old or the new version available.
|
174
|
+
if (old_addr = find_obj_addr_by_id(id))
|
175
|
+
old_header = FlatFileBlobHeader.read_at(@f, old_addr)
|
176
|
+
old_header.set_outdated_flag
|
177
|
+
end
|
178
|
+
|
145
179
|
crc = checksum(raw_obj)
|
146
180
|
|
147
181
|
# If the raw_obj is larger then 256 characters we will compress it to
|
@@ -168,12 +202,12 @@ module PEROBS
|
|
168
202
|
"blob space (#{header.length})."
|
169
203
|
end
|
170
204
|
if header.is_valid?
|
171
|
-
PEROBS.log.fatal "Entry (
|
205
|
+
PEROBS.log.fatal "Entry (flags: #{header.flags}) is already used."
|
172
206
|
end
|
173
207
|
end
|
174
|
-
|
175
|
-
|
176
|
-
|
208
|
+
flags = 1 << FlatFileBlobHeader::VALID_FLAG_BIT
|
209
|
+
flags |= (1 << FlatFileBlobHeader::COMPRESSED_FLAG_BIT) if compressed
|
210
|
+
FlatFileBlobHeader.new(@f, addr, flags, raw_obj.length, id, crc).write
|
177
211
|
@f.write(raw_obj)
|
178
212
|
if length != -1 && raw_obj.length < length
|
179
213
|
# The new object was not appended and it did not completely fill the
|
@@ -186,12 +220,20 @@ module PEROBS
|
|
186
220
|
end
|
187
221
|
space_address = @f.pos
|
188
222
|
space_length = length - FlatFileBlobHeader::LENGTH - raw_obj.length
|
189
|
-
FlatFileBlobHeader.new(
|
223
|
+
FlatFileBlobHeader.new(@f, space_address, 0, space_length,
|
224
|
+
0, 0).write
|
190
225
|
# Register the new space with the space list.
|
191
226
|
@space_list.add_space(space_address, space_length) if space_length > 0
|
192
227
|
end
|
193
|
-
|
194
|
-
|
228
|
+
if old_addr
|
229
|
+
# If we had an existing object stored for the ID we have to mark
|
230
|
+
# this entry as deleted now.
|
231
|
+
old_header.clear_flags
|
232
|
+
else
|
233
|
+
@f.flush
|
234
|
+
end
|
235
|
+
# Once the blob has been written we can update the index as well.
|
236
|
+
@index.insert(id, addr)
|
195
237
|
rescue IOError => e
|
196
238
|
PEROBS.log.fatal "Cannot write blob for ID #{id} to FlatFileDB: " +
|
197
239
|
e.message
|
@@ -204,7 +246,7 @@ module PEROBS
|
|
204
246
|
# @param id [Integer] ID of the object
|
205
247
|
# @return [Integer] Offset in the flat file or nil if not found
|
206
248
|
def find_obj_addr_by_id(id)
|
207
|
-
@index.
|
249
|
+
@index.get(id)
|
208
250
|
end
|
209
251
|
|
210
252
|
# Read the object with the given ID.
|
@@ -238,9 +280,14 @@ module PEROBS
|
|
238
280
|
PEROBS.log.fatal "Cannot read blob for ID #{id}: #{e.message}"
|
239
281
|
end
|
240
282
|
|
241
|
-
# Uncompress the data if the compression bit is set in the
|
283
|
+
# Uncompress the data if the compression bit is set in the flags byte.
|
242
284
|
if header.is_compressed?
|
243
|
-
|
285
|
+
begin
|
286
|
+
buf = Zlib.inflate(buf)
|
287
|
+
rescue Zlib::BufError, Zlib::DataError
|
288
|
+
PEROBS.log.fatal "Corrupted compressed block with ID " +
|
289
|
+
"#{header.id} found."
|
290
|
+
end
|
244
291
|
end
|
245
292
|
|
246
293
|
if checksum(buf) != header.crc
|
@@ -262,15 +309,7 @@ module PEROBS
|
|
262
309
|
# @param addr [Integer] Offset in the file
|
263
310
|
# @param id [Integer] ID of the object
|
264
311
|
def mark_obj_by_address(addr, id)
|
265
|
-
|
266
|
-
begin
|
267
|
-
@f.seek(addr)
|
268
|
-
@f.write([ header.mark | (1 << 1) ].pack('C'))
|
269
|
-
@f.flush
|
270
|
-
rescue IOError => e
|
271
|
-
PEROBS.log.fatal "Marking of FlatFile blob with ID #{id} " +
|
272
|
-
"failed: #{e.message}"
|
273
|
-
end
|
312
|
+
FlatFileBlobHeader.read_at(@f, addr, id).set_mark_flag
|
274
313
|
end
|
275
314
|
|
276
315
|
# Return true if the object with the given ID is marked, false otherwise.
|
@@ -297,14 +336,7 @@ module PEROBS
|
|
297
336
|
if header.is_valid? && header.is_marked?
|
298
337
|
# Clear all valid and marked blocks.
|
299
338
|
marked_blob_count += 1
|
300
|
-
|
301
|
-
@f.seek(pos)
|
302
|
-
@f.write([ header.mark & 0b11111101 ].pack('C'))
|
303
|
-
@f.flush
|
304
|
-
rescue IOError => e
|
305
|
-
PEROBS.log.fatal "Unmarking of FlatFile blob with ID #{blob_id} " +
|
306
|
-
"failed: #{e.message}"
|
307
|
-
end
|
339
|
+
header.clear_mark_flag
|
308
340
|
end
|
309
341
|
end
|
310
342
|
PEROBS.log.info "#{marked_blob_count} marks in #{total_blob_count} " +
|
@@ -315,6 +347,7 @@ module PEROBS
|
|
315
347
|
# implementation. No additional space will be needed on the file system.
|
316
348
|
def defragmentize
|
317
349
|
distance = 0
|
350
|
+
new_file_size = 0
|
318
351
|
deleted_blobs = 0
|
319
352
|
valid_blobs = 0
|
320
353
|
t = Time.now
|
@@ -335,17 +368,19 @@ module PEROBS
|
|
335
368
|
@f.seek(pos - distance)
|
336
369
|
@f.write(buf)
|
337
370
|
# Update the index with the new position
|
338
|
-
@index.
|
371
|
+
@index.insert(header.id, pos - distance)
|
339
372
|
# Mark the space between the relocated current entry and the
|
340
373
|
# next valid entry as deleted space.
|
341
|
-
FlatFileBlobHeader.new(
|
342
|
-
|
374
|
+
FlatFileBlobHeader.new(@f, @f.pos, 0,
|
375
|
+
distance - FlatFileBlobHeader::LENGTH,
|
376
|
+
0, 0).write
|
343
377
|
@f.flush
|
344
378
|
rescue IOError => e
|
345
379
|
PEROBS.log.fatal "Error while moving blob for ID #{header.id}: " +
|
346
380
|
e.message
|
347
381
|
end
|
348
382
|
end
|
383
|
+
new_file_size = pos + FlatFileBlobHeader::LENGTH + header.length
|
349
384
|
else
|
350
385
|
deleted_blobs += 1
|
351
386
|
distance += entry_bytes
|
@@ -357,7 +392,7 @@ module PEROBS
|
|
357
392
|
"#{'%.1f' % (distance.to_f / @f.size * 100.0)}% reclaimed"
|
358
393
|
|
359
394
|
@f.flush
|
360
|
-
@f.truncate(
|
395
|
+
@f.truncate(new_file_size)
|
361
396
|
@f.flush
|
362
397
|
@space_list.clear
|
363
398
|
|
@@ -393,56 +428,116 @@ module PEROBS
|
|
393
428
|
defragmentize
|
394
429
|
end
|
395
430
|
|
431
|
+
# Check (and repair) the FlatFile.
|
432
|
+
# @param repair [Boolean] True if errors should be fixed.
|
433
|
+
# @return [Integer] Number of errors found
|
396
434
|
def check(repair = false)
|
397
|
-
|
435
|
+
errors = 0
|
436
|
+
return errors unless @f
|
398
437
|
|
399
438
|
t = Time.now
|
400
439
|
PEROBS.log.info "Checking FlatFile database" +
|
401
440
|
"#{repair ? ' in repair mode' : ''}..."
|
402
441
|
|
403
442
|
# First check the database blob file. Each entry should be readable and
|
404
|
-
# correct.
|
443
|
+
# correct and all IDs must be unique. We use a shadow index to keep
|
444
|
+
# track of the already found IDs.
|
445
|
+
new_index = BTree.new(@db_dir, 'new-index', INDEX_BTREE_ORDER)
|
446
|
+
new_index.erase
|
447
|
+
new_index.open
|
448
|
+
|
405
449
|
each_blob_header do |pos, header|
|
406
450
|
if header.is_valid?
|
407
451
|
# We have a non-deleted entry.
|
408
452
|
begin
|
409
453
|
@f.seek(pos + FlatFileBlobHeader::LENGTH)
|
410
454
|
buf = @f.read(header.length)
|
455
|
+
if buf.length != header.length
|
456
|
+
PEROBS.log.error "Premature end of file in blob with ID " +
|
457
|
+
"#{header.id}."
|
458
|
+
discard_damaged_blob(header) if repair
|
459
|
+
errors += 1
|
460
|
+
next
|
461
|
+
end
|
462
|
+
|
411
463
|
# Uncompress the data if the compression bit is set in the mark
|
412
464
|
# byte.
|
413
|
-
|
465
|
+
if header.is_compressed?
|
466
|
+
begin
|
467
|
+
buf = Zlib.inflate(buf)
|
468
|
+
rescue Zlib::BufError, Zlib::DataError
|
469
|
+
PEROBS.log.error "Corrupted compressed block with ID " +
|
470
|
+
"#{header.id} found."
|
471
|
+
discard_damaged_blob(header) if repair
|
472
|
+
errors += 1
|
473
|
+
next
|
474
|
+
end
|
475
|
+
end
|
414
476
|
|
415
477
|
if header.crc && checksum(buf) != header.crc
|
416
|
-
|
417
|
-
|
418
|
-
|
419
|
-
|
420
|
-
|
421
|
-
PEROBS.log.fatal "Checksum failure while checking blob " +
|
422
|
-
"with ID #{header.id}"
|
423
|
-
end
|
478
|
+
PEROBS.log.error "Checksum failure while checking blob " +
|
479
|
+
"with ID #{header.id}"
|
480
|
+
discard_damaged_blob(header) if repair
|
481
|
+
errors += 1
|
482
|
+
next
|
424
483
|
end
|
425
484
|
rescue IOError => e
|
426
485
|
PEROBS.log.fatal "Check of blob with ID #{header.id} failed: " +
|
427
486
|
e.message
|
428
487
|
end
|
488
|
+
|
489
|
+
# Check if the ID has already been found in the file.
|
490
|
+
if (previous_address = new_index.get(header.id))
|
491
|
+
PEROBS.log.error "Multiple blobs for ID #{header.id} found. " +
|
492
|
+
"Addresses: #{previous_address}, #{pos}"
|
493
|
+
previous_header = FlatFileBlobHeader.read_at(@f, previous_address,
|
494
|
+
header.id)
|
495
|
+
if repair
|
496
|
+
# We have two blobs with the same ID and we must discard one of
|
497
|
+
# them.
|
498
|
+
if header.is_outdated?
|
499
|
+
discard_damaged_blob(header)
|
500
|
+
elsif previous_header.is_outdated?
|
501
|
+
discard_damaged_blob(previous_header)
|
502
|
+
else
|
503
|
+
PEROBS.log.error "None of the blobs with same ID have " +
|
504
|
+
"the outdated flag set. Deleting the smaller one."
|
505
|
+
discard_damaged_blob(header.length < previous_header.length ?
|
506
|
+
header : previous_header)
|
507
|
+
end
|
508
|
+
next
|
509
|
+
end
|
510
|
+
else
|
511
|
+
# ID is unique so far. Add it to the shadow index.
|
512
|
+
new_index.insert(header.id, pos)
|
513
|
+
end
|
514
|
+
|
429
515
|
end
|
430
516
|
end
|
517
|
+
# We no longer need the new index.
|
518
|
+
new_index.close
|
519
|
+
new_index.erase
|
431
520
|
|
432
521
|
# Now we check the index data. It must be correct and the entries must
|
433
522
|
# match the blob file. All entries in the index must be in the blob file
|
434
523
|
# and vise versa.
|
435
524
|
begin
|
436
|
-
|
437
|
-
|
525
|
+
index_ok = @index.check do |id, address|
|
526
|
+
has_id_at?(id, address)
|
527
|
+
end
|
528
|
+
unless index_ok && @space_list.check(self) && cross_check_entries
|
438
529
|
regenerate_index_and_spaces if repair
|
439
530
|
end
|
440
531
|
rescue PEROBS::FatalError
|
532
|
+
errors += 1
|
441
533
|
regenerate_index_and_spaces if repair
|
442
534
|
end
|
443
535
|
|
444
536
|
sync if repair
|
445
|
-
PEROBS.log.info "check_db completed in #{Time.now - t} seconds"
|
537
|
+
PEROBS.log.info "check_db completed in #{Time.now - t} seconds. " +
|
538
|
+
"#{errors} errors found."
|
539
|
+
|
540
|
+
errors
|
446
541
|
end
|
447
542
|
|
448
543
|
# This method clears the index tree and the free space list and
|
@@ -454,7 +549,7 @@ module PEROBS
|
|
454
549
|
|
455
550
|
each_blob_header do |pos, header|
|
456
551
|
if header.is_valid?
|
457
|
-
@index.
|
552
|
+
@index.insert(header.id, pos)
|
458
553
|
else
|
459
554
|
@space_list.add_space(pos, header.length) if header.length > 0
|
460
555
|
end
|
@@ -474,7 +569,7 @@ module PEROBS
|
|
474
569
|
def inspect
|
475
570
|
s = '['
|
476
571
|
each_blob_header do |pos, header|
|
477
|
-
s << "{ :pos => #{pos}, :
|
572
|
+
s << "{ :pos => #{pos}, :flags => #{header.flags}, " +
|
478
573
|
":length => #{header.length}, :id => #{header.id}, " +
|
479
574
|
":crc => #{header.crc}"
|
480
575
|
if header.is_valid?
|
@@ -485,8 +580,6 @@ module PEROBS
|
|
485
580
|
s + ']'
|
486
581
|
end
|
487
582
|
|
488
|
-
|
489
|
-
|
490
583
|
private
|
491
584
|
|
492
585
|
def each_blob_header(&block)
|
@@ -529,6 +622,8 @@ module PEROBS
|
|
529
622
|
end
|
530
623
|
|
531
624
|
def cross_check_entries
|
625
|
+
errors = 0
|
626
|
+
|
532
627
|
each_blob_header do |pos, header|
|
533
628
|
if !header.is_valid?
|
534
629
|
if header.length > 0
|
@@ -536,19 +631,25 @@ module PEROBS
|
|
536
631
|
PEROBS.log.error "FlatFile has free space " +
|
537
632
|
"(addr: #{pos}, len: #{header.length}) that is not in " +
|
538
633
|
"FreeSpaceManager"
|
539
|
-
|
634
|
+
errors += 1
|
540
635
|
end
|
541
636
|
end
|
542
637
|
else
|
543
|
-
unless @index.
|
638
|
+
unless @index.get(header.id) == pos
|
544
639
|
PEROBS.log.error "FlatFile blob at address #{pos} is listed " +
|
545
|
-
"in index with address #{@index.
|
546
|
-
|
640
|
+
"in index with address #{@index.get(header.id)}"
|
641
|
+
errors += 1
|
547
642
|
end
|
548
643
|
end
|
549
644
|
end
|
550
645
|
|
551
|
-
|
646
|
+
errors == 0
|
647
|
+
end
|
648
|
+
|
649
|
+
def discard_damaged_blob(header)
|
650
|
+
PEROBS.log.error "Discarding corrupted data blob for ID #{header.id} " +
|
651
|
+
"at offset #{header.addr}"
|
652
|
+
header.clear_flags
|
552
653
|
end
|
553
654
|
|
554
655
|
end
|
@@ -31,16 +31,17 @@ module PEROBS
|
|
31
31
|
|
32
32
|
# The FlatFile blob header has the following structure:
|
33
33
|
#
|
34
|
-
# 1 Byte:
|
34
|
+
# 1 Byte: Flags byte.
|
35
35
|
# Bit 0: 0 deleted entry, 1 valid entry
|
36
36
|
# Bit 1: 0 unmarked, 1 marked
|
37
37
|
# Bit 2: 0 uncompressed data, 1 compressed data
|
38
|
-
# Bit 3
|
38
|
+
# Bit 3: 0 current entry, 1 outdated entry
|
39
|
+
# Bit 4 - 7: reserved, must be 0
|
39
40
|
# 8 bytes: Length of the data blob in bytes
|
40
41
|
# 8 bytes: ID of the value in the data blob
|
41
42
|
# 4 bytes: CRC32 checksum of the data blob
|
42
43
|
#
|
43
|
-
# If the bit 0 of the
|
44
|
+
# If the bit 0 of the flags byte is 0, only the length is valid. The blob is
|
44
45
|
# empty. Only of bit 0 is set then entry is valid.
|
45
46
|
class FlatFileBlobHeader
|
46
47
|
|
@@ -48,16 +49,24 @@ module PEROBS
|
|
48
49
|
FORMAT = 'CQQL'
|
49
50
|
# The length of the header in bytes.
|
50
51
|
LENGTH = 21
|
52
|
+
VALID_FLAG_BIT = 0
|
53
|
+
MARK_FLAG_BIT = 1
|
54
|
+
COMPRESSED_FLAG_BIT = 2
|
55
|
+
OUTDATED_FLAG_BIT = 3
|
51
56
|
|
52
|
-
attr_reader :
|
57
|
+
attr_reader :addr, :flags, :length, :id, :crc
|
53
58
|
|
54
|
-
# Create a new FlatFileBlobHeader with the given
|
55
|
-
# @param
|
59
|
+
# Create a new FlatFileBlobHeader with the given flags, length, id and crc.
|
60
|
+
# @param file [File] the FlatFile that contains the header
|
61
|
+
# @param addr [Integer] the offset address of the header in the file
|
62
|
+
# @param flags [Fixnum] 8 bit number, see above
|
56
63
|
# @param length [Fixnum] length of the header in bytes
|
57
64
|
# @param id [Integer] ID of the blob entry
|
58
65
|
# @param crc [Fixnum] CRC32 checksum of the blob entry
|
59
|
-
def initialize(
|
60
|
-
@
|
66
|
+
def initialize(file, addr, flags, length, id, crc)
|
67
|
+
@file = file
|
68
|
+
@addr = addr
|
69
|
+
@flags = flags
|
61
70
|
@length = length
|
62
71
|
@id = id
|
63
72
|
@crc = crc
|
@@ -68,14 +77,22 @@ module PEROBS
|
|
68
77
|
# @return FlatFileBlobHeader
|
69
78
|
def FlatFileBlobHeader::read(file)
|
70
79
|
begin
|
80
|
+
addr = file.pos
|
71
81
|
buf = file.read(LENGTH)
|
72
82
|
rescue IOError => e
|
73
|
-
PEROBS.log.
|
83
|
+
PEROBS.log.error "Cannot read blob header in flat file DB: #{e.message}"
|
84
|
+
return nil
|
74
85
|
end
|
75
86
|
|
76
87
|
return nil unless buf
|
77
88
|
|
78
|
-
|
89
|
+
if buf.length != LENGTH
|
90
|
+
PEROBS.log.error "Incomplete FlatFileBlobHeader: Only #{buf.length} " +
|
91
|
+
"bytes of #{LENGTH} could be read"
|
92
|
+
return nil
|
93
|
+
end
|
94
|
+
|
95
|
+
FlatFileBlobHeader.new(file, addr, *buf.unpack(FORMAT))
|
79
96
|
end
|
80
97
|
|
81
98
|
# Read the header from the given File.
|
@@ -96,7 +113,7 @@ module PEROBS
|
|
96
113
|
"#{id ? "for ID #{id} " : ''}at address " +
|
97
114
|
"#{addr}"
|
98
115
|
end
|
99
|
-
header = FlatFileBlobHeader.new(*buf.unpack(FORMAT))
|
116
|
+
header = FlatFileBlobHeader.new(file, addr, *buf.unpack(FORMAT))
|
100
117
|
if id && header.id != id
|
101
118
|
PEROBS.log.fatal "Mismatch between FlatFile index and blob file " +
|
102
119
|
"found for entry with ID #{id}/#{header.id}"
|
@@ -107,35 +124,93 @@ module PEROBS
|
|
107
124
|
|
108
125
|
# Write the header to a given File.
|
109
126
|
# @param file [File]
|
110
|
-
def write
|
127
|
+
def write
|
111
128
|
begin
|
112
|
-
file.
|
129
|
+
@file.seek(@addr)
|
130
|
+
@file.write([ @flags, @length, @id, @crc].pack(FORMAT))
|
113
131
|
rescue IOError => e
|
114
132
|
PEROBS.log.fatal "Cannot write blob header into flat file DB: " +
|
115
133
|
e.message
|
116
134
|
end
|
117
135
|
end
|
118
136
|
|
137
|
+
# Reset all the flags bit to 0. This marks the blob as invalid.
|
138
|
+
# @param file [File] The file handle of the blob file.
|
139
|
+
# @param addr [Integer] The address of the header
|
140
|
+
def clear_flags
|
141
|
+
begin
|
142
|
+
@file.seek(@addr)
|
143
|
+
@file.write([ 0 ].pack('C'))
|
144
|
+
@file.flush
|
145
|
+
rescue IOError => e
|
146
|
+
PEROBS.log.fatal "Clearing flags of FlatFileBlobHeader with ID " +
|
147
|
+
"#{@id} failed: #{e.message}"
|
148
|
+
end
|
149
|
+
end
|
150
|
+
|
119
151
|
# Return true if the header is for a non-empty blob.
|
120
152
|
def is_valid?
|
121
|
-
bit_set?(
|
153
|
+
bit_set?(VALID_FLAG_BIT)
|
122
154
|
end
|
123
155
|
|
124
156
|
# Return true if the blob has been marked.
|
125
157
|
def is_marked?
|
126
|
-
bit_set?(
|
158
|
+
bit_set?(MARK_FLAG_BIT)
|
159
|
+
end
|
160
|
+
|
161
|
+
# Set the mark bit.
|
162
|
+
def set_mark_flag
|
163
|
+
set_flag(MARK_FLAG_BIT)
|
164
|
+
write_flags
|
165
|
+
end
|
166
|
+
|
167
|
+
# Clear the mark bit.
|
168
|
+
def clear_mark_flag
|
169
|
+
clear_flag(MARK_FLAG_BIT)
|
170
|
+
write_flags
|
127
171
|
end
|
128
172
|
|
129
173
|
# Return true if the blob contains compressed data.
|
130
174
|
def is_compressed?
|
131
|
-
bit_set?(
|
175
|
+
bit_set?(COMPRESSED_FLAG_BIT)
|
176
|
+
end
|
177
|
+
|
178
|
+
# Set the outdated bit. The entry will be invalid as soon as the current
|
179
|
+
# transaction has been completed.
|
180
|
+
def set_outdated_flag
|
181
|
+
set_flag(OUTDATED_FLAG_BIT)
|
182
|
+
write_flags
|
183
|
+
end
|
184
|
+
|
185
|
+
# Return true if the blob contains outdated data.
|
186
|
+
def is_outdated?
|
187
|
+
bit_set?(OUTDATED_FLAG_BIT)
|
132
188
|
end
|
133
189
|
|
134
190
|
private
|
135
191
|
|
192
|
+
def write_flags
|
193
|
+
begin
|
194
|
+
@file.seek(@addr)
|
195
|
+
@file.write([ @flags ].pack('C'))
|
196
|
+
@file.flush
|
197
|
+
rescue IOError => e
|
198
|
+
PEROBS.log.fatal "Writing flags of FlatFileBlobHeader with ID #{@id} " +
|
199
|
+
"failed: #{e.message}"
|
200
|
+
end
|
201
|
+
end
|
202
|
+
|
136
203
|
def bit_set?(n)
|
137
204
|
mask = 1 << n
|
138
|
-
@
|
205
|
+
@flags & mask == mask
|
206
|
+
end
|
207
|
+
|
208
|
+
def set_flag(n)
|
209
|
+
@flags |= (1 << n)
|
210
|
+
end
|
211
|
+
|
212
|
+
def clear_flag(n)
|
213
|
+
@flags &= ~(1 << n) & 0xFF
|
139
214
|
end
|
140
215
|
|
141
216
|
end
|