isomorfeus-ferret 0.13.5 → 0.13.6
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/ext/isomorfeus_ferret_ext/frt_compound_io.c +4 -1
- data/ext/isomorfeus_ferret_ext/frt_fs_store.c +2 -4
- data/ext/isomorfeus_ferret_ext/frt_index.c +27 -60
- data/ext/isomorfeus_ferret_ext/frt_index.h +2 -2
- data/ext/isomorfeus_ferret_ext/test.c +1 -1
- data/ext/isomorfeus_ferret_ext/test_compound_io.c +3 -3
- data/ext/isomorfeus_ferret_ext/test_hash.c +1 -0
- data/lib/isomorfeus/ferret/version.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 524b384c2ab35457603726287160b443a50939473bab7852e5e6f5f886ded0a7
|
4
|
+
data.tar.gz: b304d0386bc0b14e68167bfcc1b62346f81c02f6eff25c3a6633bb0a1919083e
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: b378ce12aa56bb35e57eec2c8df64152a7a7bd5cb1345d4a7dc0264e236fddcea3ffbc41a7213401cf50ff163c3172169fbf93699a4a7f96505f300782bc9a92
|
7
|
+
data.tar.gz: 6954e297df285f7726bd925a6f4dda4300f06d059dc4b674a494e775b901f7ea9e529e62be8793049c6df20a17515c41741f63155fbdd661de4595694deb4c27
|
@@ -329,7 +329,7 @@ static void cw_copy_file(FrtCompoundWriter *cw, FrtCWFileEntry *src, FrtOutStrea
|
|
329
329
|
frt_is_close(is);
|
330
330
|
}
|
331
331
|
|
332
|
-
void frt_cw_close(FrtCompoundWriter *cw)
|
332
|
+
void frt_cw_close(FrtCompoundWriter *cw, FrtDeleter *dlr)
|
333
333
|
{
|
334
334
|
FrtOutStream *os = NULL;
|
335
335
|
int i;
|
@@ -356,6 +356,9 @@ void frt_cw_close(FrtCompoundWriter *cw)
|
|
356
356
|
for (i = 0; i < frt_ary_size(cw->file_entries); i++) {
|
357
357
|
cw->file_entries[i].data_offset = frt_os_pos(os);
|
358
358
|
cw_copy_file(cw, &cw->file_entries[i], os);
|
359
|
+
if (dlr) {
|
360
|
+
frt_deleter_queue_file(dlr, cw->file_entries[i].name);
|
361
|
+
}
|
359
362
|
}
|
360
363
|
|
361
364
|
/* Write the data offsets into the directory of the compound stream */
|
@@ -272,15 +272,13 @@ static const struct FrtOutStreamMethods FS_OUT_STREAM_METHODS = {
|
|
272
272
|
static FrtOutStream *fs_new_output(FrtStore *store, const char *filename)
|
273
273
|
{
|
274
274
|
char path[FRT_MAX_FILE_PATH];
|
275
|
-
int fd = open(join_path(path, store->dir.path, filename),
|
276
|
-
O_WRONLY | O_CREAT | O_BINARY, store->file_mode);
|
277
|
-
FrtOutStream *os;
|
275
|
+
int fd = open(join_path(path, store->dir.path, filename), O_WRONLY | O_CREAT | O_BINARY, store->file_mode);
|
278
276
|
if (fd < 0) {
|
279
277
|
FRT_RAISE(FRT_IO_ERROR, "couldn't create OutStream %s: <%s>",
|
280
278
|
path, strerror(errno));
|
281
279
|
}
|
282
280
|
|
283
|
-
os = frt_os_new();
|
281
|
+
FrtOutStream *os = frt_os_new();
|
284
282
|
os->file.fd = fd;
|
285
283
|
os->m = &FS_OUT_STREAM_METHODS;
|
286
284
|
return os;
|
@@ -681,15 +681,13 @@ static char *si_norm_file_name(FrtSegmentInfo *si, char *buf, int field_num)
|
|
681
681
|
if (field_num >= si->norm_gens_size
|
682
682
|
|| 0 > (norm_gen = si->norm_gens[field_num])) {
|
683
683
|
return NULL;
|
684
|
-
}
|
685
|
-
else {
|
684
|
+
} else {
|
686
685
|
const char *ext = (si->use_compound_file && norm_gen > 0) ? "s" : "f";
|
687
686
|
return fn_for_gen_field(buf, si->name, ext, norm_gen, field_num);
|
688
687
|
}
|
689
688
|
}
|
690
689
|
|
691
|
-
|
692
|
-
#define DEL(file_name) deleter_queue_file(dlr, file_name)
|
690
|
+
void frt_deleter_queue_file(FrtDeleter *dlr, const char *file_name);
|
693
691
|
|
694
692
|
static void si_delete_files(FrtSegmentInfo *si, FrtFieldInfos *fis, FrtDeleter *dlr)
|
695
693
|
{
|
@@ -700,7 +698,7 @@ static void si_delete_files(FrtSegmentInfo *si, FrtFieldInfos *fis, FrtDeleter *
|
|
700
698
|
|
701
699
|
for (i = si->norm_gens_size - 1; i >= 0; i--) {
|
702
700
|
if (0 <= si->norm_gens[i]) {
|
703
|
-
|
701
|
+
frt_deleter_queue_file(dlr, si_norm_file_name(si, file_name, fis->fields[i]->number));
|
704
702
|
}
|
705
703
|
}
|
706
704
|
|
@@ -710,15 +708,14 @@ static void si_delete_files(FrtSegmentInfo *si, FrtFieldInfos *fis, FrtDeleter *
|
|
710
708
|
|
711
709
|
if (si->use_compound_file) {
|
712
710
|
memcpy(ext, "cfs", 4);
|
713
|
-
|
711
|
+
frt_deleter_queue_file(dlr, file_name);
|
714
712
|
if (0 <= si->del_gen) {
|
715
|
-
|
713
|
+
frt_deleter_queue_file(dlr, frt_fn_for_generation(file_name, si->name, "del", si->del_gen));
|
716
714
|
}
|
717
|
-
}
|
718
|
-
else {
|
715
|
+
} else {
|
719
716
|
for (i = FRT_NELEMS(INDEX_EXTENSIONS) - 1; i >= 0; i--) {
|
720
717
|
memcpy(ext, INDEX_EXTENSIONS[i], 4);
|
721
|
-
|
718
|
+
frt_deleter_queue_file(dlr, file_name);
|
722
719
|
}
|
723
720
|
}
|
724
721
|
}
|
@@ -3695,8 +3692,7 @@ static bool file_name_filter_is_cfs_file(const char *file_name) {
|
|
3695
3692
|
****************************************************************************/
|
3696
3693
|
|
3697
3694
|
#define DELETABLE_START_CAPA 8
|
3698
|
-
FrtDeleter *frt_deleter_new(FrtSegmentInfos *sis, FrtStore *store)
|
3699
|
-
{
|
3695
|
+
FrtDeleter *frt_deleter_new(FrtSegmentInfos *sis, FrtStore *store) {
|
3700
3696
|
FrtDeleter *dlr = FRT_ALLOC(FrtDeleter);
|
3701
3697
|
dlr->sis = sis;
|
3702
3698
|
dlr->store = store;
|
@@ -3704,19 +3700,16 @@ FrtDeleter *frt_deleter_new(FrtSegmentInfos *sis, FrtStore *store)
|
|
3704
3700
|
return dlr;
|
3705
3701
|
}
|
3706
3702
|
|
3707
|
-
void frt_deleter_destroy(FrtDeleter *dlr)
|
3708
|
-
{
|
3703
|
+
void frt_deleter_destroy(FrtDeleter *dlr) {
|
3709
3704
|
frt_hs_destroy(dlr->pending);
|
3710
3705
|
free(dlr);
|
3711
3706
|
}
|
3712
3707
|
|
3713
|
-
|
3714
|
-
{
|
3708
|
+
void frt_deleter_queue_file(FrtDeleter *dlr, const char *file_name) {
|
3715
3709
|
frt_hs_add(dlr->pending, frt_estrdup(file_name));
|
3716
3710
|
}
|
3717
3711
|
|
3718
|
-
void frt_deleter_delete_file(FrtDeleter *dlr, char *file_name)
|
3719
|
-
{
|
3712
|
+
void frt_deleter_delete_file(FrtDeleter *dlr, char *file_name) {
|
3720
3713
|
FrtStore *store = dlr->store;
|
3721
3714
|
FRT_TRY
|
3722
3715
|
if (store->exists(store, file_name)) {
|
@@ -3728,8 +3721,7 @@ void frt_deleter_delete_file(FrtDeleter *dlr, char *file_name)
|
|
3728
3721
|
FRT_XENDTRY
|
3729
3722
|
}
|
3730
3723
|
|
3731
|
-
static void deleter_commit_pending_deletions(FrtDeleter *dlr)
|
3732
|
-
{
|
3724
|
+
static void deleter_commit_pending_deletions(FrtDeleter *dlr) {
|
3733
3725
|
FrtHashSetEntry *hse, *hse_next = dlr->pending->first;
|
3734
3726
|
while ((hse = hse_next) != NULL) {
|
3735
3727
|
hse_next = hse->next;
|
@@ -3737,23 +3729,13 @@ static void deleter_commit_pending_deletions(FrtDeleter *dlr)
|
|
3737
3729
|
}
|
3738
3730
|
}
|
3739
3731
|
|
3740
|
-
void frt_deleter_delete_files(FrtDeleter *dlr, char **files, int file_cnt)
|
3741
|
-
{
|
3742
|
-
int i;
|
3743
|
-
for (i = file_cnt - 1; i >= 0; i--) {
|
3744
|
-
deleter_queue_file(dlr, files[i]);
|
3745
|
-
}
|
3746
|
-
deleter_commit_pending_deletions(dlr);
|
3747
|
-
}
|
3748
|
-
|
3749
3732
|
struct DelFilesArg {
|
3750
3733
|
char curr_seg_file_name[FRT_SEGMENT_NAME_MAX_LENGTH];
|
3751
3734
|
FrtDeleter *dlr;
|
3752
3735
|
FrtHash *current;
|
3753
3736
|
};
|
3754
3737
|
|
3755
|
-
static void frt_deleter_find_deletable_files_i(const char *file_name, void *arg)
|
3756
|
-
{
|
3738
|
+
static void frt_deleter_find_deletable_files_i(const char *file_name, void *arg) {
|
3757
3739
|
struct DelFilesArg *dfa = (struct DelFilesArg *)arg;
|
3758
3740
|
FrtDeleter *dlr = dfa->dlr;
|
3759
3741
|
|
@@ -3773,8 +3755,7 @@ static void frt_deleter_find_deletable_files_i(const char *file_name, void *arg)
|
|
3773
3755
|
if (NULL != p) {
|
3774
3756
|
*p = '\0';
|
3775
3757
|
extension = p + 1;
|
3776
|
-
}
|
3777
|
-
else {
|
3758
|
+
} else {
|
3778
3759
|
extension = NULL;
|
3779
3760
|
}
|
3780
3761
|
|
@@ -3789,16 +3770,14 @@ static void frt_deleter_find_deletable_files_i(const char *file_name, void *arg)
|
|
3789
3770
|
if (NULL == (si = (FrtSegmentInfo *)frt_h_get(dfa->current, segment_name))) {
|
3790
3771
|
/* Delete if segment is not referenced: */
|
3791
3772
|
do_delete = true;
|
3792
|
-
}
|
3793
|
-
else {
|
3773
|
+
} else {
|
3794
3774
|
char tmp_fn[FRT_SEGMENT_NAME_MAX_LENGTH];
|
3795
3775
|
/* OK, segment is referenced, but file may still be orphan'd: */
|
3796
3776
|
if (file_name_filter_is_cfs_file(file_name)
|
3797
3777
|
&& si->use_compound_file) {
|
3798
3778
|
/* This file is stored in a CFS file for this segment: */
|
3799
3779
|
do_delete = true;
|
3800
|
-
}
|
3801
|
-
else if (0 == strcmp("del", extension)) {
|
3780
|
+
} else if (0 == strcmp("del", extension)) {
|
3802
3781
|
/* This is a _segmentName_N.del file: */
|
3803
3782
|
if (!frt_fn_for_generation(tmp_fn, segment_name, "del", si->del_gen)
|
3804
3783
|
|| 0 != strcmp(file_name, tmp_fn)) {
|
@@ -3807,8 +3786,7 @@ static void frt_deleter_find_deletable_files_i(const char *file_name, void *arg)
|
|
3807
3786
|
* this segment, then delete it: */
|
3808
3787
|
do_delete = true;
|
3809
3788
|
}
|
3810
|
-
}
|
3811
|
-
else if (NULL != extension
|
3789
|
+
} else if (NULL != extension
|
3812
3790
|
&& ('s' == *extension || 'f' == *extension)
|
3813
3791
|
&& isdigit(extension[1])) {
|
3814
3792
|
si_norm_file_name(si, tmp_fn, atoi(extension + 1));
|
@@ -3817,15 +3795,14 @@ static void frt_deleter_find_deletable_files_i(const char *file_name, void *arg)
|
|
3817
3795
|
/* This is an orphan'd norms file: */
|
3818
3796
|
do_delete = true;
|
3819
3797
|
}
|
3820
|
-
}
|
3821
|
-
else if (0 == strcmp("cfs", extension) && !si->use_compound_file) {
|
3798
|
+
} else if (0 == strcmp("cfs", extension) && !si->use_compound_file) {
|
3822
3799
|
/* This is a partially written _segmentName.cfs: */
|
3823
3800
|
do_delete = true;
|
3824
3801
|
}
|
3825
3802
|
}
|
3826
3803
|
|
3827
3804
|
if (do_delete) {
|
3828
|
-
|
3805
|
+
frt_deleter_queue_file(dlr, file_name);
|
3829
3806
|
}
|
3830
3807
|
}
|
3831
3808
|
}
|
@@ -3837,8 +3814,7 @@ static void frt_deleter_find_deletable_files_i(const char *file_name, void *arg)
|
|
3837
3814
|
* create the unused file (eg when merging segments), and we only remove from
|
3838
3815
|
* deletable when a file is successfully deleted.
|
3839
3816
|
*/
|
3840
|
-
void frt_deleter_find_deletable_files(FrtDeleter *dlr)
|
3841
|
-
{
|
3817
|
+
void frt_deleter_find_deletable_files(FrtDeleter *dlr) {
|
3842
3818
|
/* Gather all "current" segments: */
|
3843
3819
|
int i;
|
3844
3820
|
FrtSegmentInfos *sis = dlr->sis;
|
@@ -4207,7 +4183,7 @@ static void norm_rewrite(Norm *norm, FrtStore *store, FrtDeleter *dlr,
|
|
4207
4183
|
const int field_num = norm->field_num;
|
4208
4184
|
|
4209
4185
|
if (si_norm_file_name(si, norm_file_name, field_num)) {
|
4210
|
-
|
4186
|
+
frt_deleter_queue_file(dlr, norm_file_name);
|
4211
4187
|
}
|
4212
4188
|
frt_si_advance_norm_gen(si, field_num);
|
4213
4189
|
si_norm_file_name(si, norm_file_name, field_num);
|
@@ -4363,7 +4339,7 @@ static void sr_commit_i(FrtIndexReader *ir)
|
|
4363
4339
|
if (SR(ir)->undelete_all || SR(ir)->deleted_docs_dirty) {
|
4364
4340
|
if (si->del_gen >= 0) {
|
4365
4341
|
frt_fn_for_generation(tmp_file_name, segment, "del", si->del_gen);
|
4366
|
-
|
4342
|
+
frt_deleter_queue_file(ir->deleter, tmp_file_name);
|
4367
4343
|
}
|
4368
4344
|
if (SR(ir)->undelete_all) {
|
4369
4345
|
si->del_gen = -1;
|
@@ -5687,7 +5663,6 @@ static SegmentMergeInfo *smi_new(int base, FrtStore *store, FrtSegmentInfo *si)
|
|
5687
5663
|
smi->store = frt_open_cmpd_store(store, file_name);
|
5688
5664
|
}
|
5689
5665
|
|
5690
|
-
|
5691
5666
|
sprintf(file_name, "%s.fdx", segment);
|
5692
5667
|
smi->doc_cnt = smi->max_doc
|
5693
5668
|
= smi->store->length(smi->store, file_name) / FIELDS_IDX_PTR_SIZE;
|
@@ -6116,14 +6091,7 @@ int frt_iw_doc_count(FrtIndexWriter *iw)
|
|
6116
6091
|
return doc_cnt;
|
6117
6092
|
}
|
6118
6093
|
|
6119
|
-
|
6120
|
-
deleter_queue_file(dlr, file_name);\
|
6121
|
-
frt_cw_add_file(cw, file_name)
|
6122
|
-
|
6123
|
-
static void iw_create_compound_file(FrtStore *store, FrtFieldInfos *fis,
|
6124
|
-
FrtSegmentInfo *si, char *cfs_file_name,
|
6125
|
-
FrtDeleter *dlr)
|
6126
|
-
{
|
6094
|
+
static void iw_create_compound_file(FrtStore *store, FrtFieldInfos *fis, FrtSegmentInfo *si, char *cfs_file_name, FrtDeleter *dlr) {
|
6127
6095
|
int i;
|
6128
6096
|
FrtCompoundWriter *cw;
|
6129
6097
|
char file_name[FRT_SEGMENT_NAME_MAX_LENGTH];
|
@@ -6137,19 +6105,18 @@ static void iw_create_compound_file(FrtStore *store, FrtFieldInfos *fis,
|
|
6137
6105
|
cw = frt_open_cw(store, cfs_file_name);
|
6138
6106
|
for (i = 0; i < FRT_NELEMS(COMPOUND_EXTENSIONS); i++) {
|
6139
6107
|
memcpy(ext, COMPOUND_EXTENSIONS[i], 4);
|
6140
|
-
|
6108
|
+
frt_cw_add_file(cw, file_name);
|
6141
6109
|
}
|
6142
6110
|
|
6143
6111
|
/* Field norm file_names */
|
6144
6112
|
for (i = fis->size - 1; i >= 0; i--) {
|
6145
|
-
if (fi_has_norms(fis->fields[i])
|
6146
|
-
|
6147
|
-
MOVE_TO_COMPOUND_DIR(file_name);
|
6113
|
+
if (fi_has_norms(fis->fields[i]) && si_norm_file_name(si, file_name, i)) {
|
6114
|
+
frt_cw_add_file(cw, file_name);
|
6148
6115
|
}
|
6149
6116
|
}
|
6150
6117
|
|
6151
6118
|
/* Perform the merge */
|
6152
|
-
frt_cw_close(cw);
|
6119
|
+
frt_cw_close(cw, dlr);
|
6153
6120
|
}
|
6154
6121
|
|
6155
6122
|
static void iw_commit_compound_file(FrtIndexWriter *iw, FrtSegmentInfo *si)
|
@@ -627,9 +627,9 @@ struct FrtDeleter {
|
|
627
627
|
|
628
628
|
extern FrtDeleter *frt_deleter_new(FrtSegmentInfos *sis, FrtStore *store);
|
629
629
|
extern void frt_deleter_destroy(FrtDeleter *dlr);
|
630
|
+
extern void frt_deleter_queue_file(FrtDeleter *dlr, const char *file_name);
|
630
631
|
extern void frt_deleter_delete_file(FrtDeleter *dlr, char *file_name);
|
631
632
|
extern void frt_deleter_find_deletable_files(FrtDeleter *dlr);
|
632
|
-
extern void frt_deleter_delete_files(FrtDeleter *dlr, char **files, int file_cnt);
|
633
633
|
|
634
634
|
/****************************************************************************
|
635
635
|
*
|
@@ -859,6 +859,6 @@ typedef struct FrtCompoundWriter {
|
|
859
859
|
|
860
860
|
extern FrtCompoundWriter *frt_open_cw(FrtStore *store, char *name);
|
861
861
|
extern void frt_cw_add_file(FrtCompoundWriter *cw, char *id);
|
862
|
-
extern void frt_cw_close(FrtCompoundWriter *cw);
|
862
|
+
extern void frt_cw_close(FrtCompoundWriter *cw, FrtDeleter *dlr);
|
863
863
|
|
864
864
|
#endif
|
@@ -810,7 +810,7 @@ void Init_Test(void) {
|
|
810
810
|
rb_define_singleton_method(mTest, "filter", frb_ts_filter, 0);
|
811
811
|
rb_define_singleton_method(mTest, "fs_store", frb_ts_fs_store, 0);
|
812
812
|
rb_define_singleton_method(mTest, "global", frb_ts_global, 0);
|
813
|
-
rb_define_singleton_method(mTest, "
|
813
|
+
rb_define_singleton_method(mTest, "test_hash", frb_ts_hash, 0);
|
814
814
|
rb_define_singleton_method(mTest, "hashset", frb_ts_hashset, 0);
|
815
815
|
rb_define_singleton_method(mTest, "helper", frb_ts_helper, 0);
|
816
816
|
rb_define_singleton_method(mTest, "highlighter", frb_ts_highlighter, 0);
|
@@ -48,7 +48,7 @@ void test_compound_writer(TestCase *tc, void *data)
|
|
48
48
|
cw = frt_open_cw(store, (char *)"cfile");
|
49
49
|
frt_cw_add_file(cw, (char *)"file1");
|
50
50
|
frt_cw_add_file(cw, (char *)"file2");
|
51
|
-
frt_cw_close(cw);
|
51
|
+
frt_cw_close(cw, NULL);
|
52
52
|
|
53
53
|
is = store->open_input(store, "cfile");
|
54
54
|
Aiequal(2, frt_is_read_vint(is));
|
@@ -94,7 +94,7 @@ void test_compound_io(TestCase *tc, void *data)
|
|
94
94
|
frt_cw_add_file(cw, (char *)"file1");
|
95
95
|
frt_cw_add_file(cw, (char *)"file2");
|
96
96
|
frt_cw_add_file(cw, (char *)"file3");
|
97
|
-
frt_cw_close(cw);
|
97
|
+
frt_cw_close(cw, NULL);
|
98
98
|
|
99
99
|
c_reader = frt_open_cmpd_store(store, "cfile");
|
100
100
|
is1 = c_reader->open_input(c_reader, "file1");
|
@@ -137,7 +137,7 @@ void test_compound_io_many_files(TestCase *tc, void *data)
|
|
137
137
|
frt_os_write_vint(os, MAGIC);
|
138
138
|
frt_os_close(os);
|
139
139
|
}
|
140
|
-
frt_cw_close(cw);
|
140
|
+
frt_cw_close(cw, NULL);
|
141
141
|
|
142
142
|
c_reader = frt_open_cmpd_store(store, "_.cfs");
|
143
143
|
for (i = 0; i < TEST_FILE_CNT; i++) {
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: isomorfeus-ferret
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.13.
|
4
|
+
version: 0.13.6
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Jan Biedermann
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2022-04-
|
11
|
+
date: 2022-04-26 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: rake
|