1 /** @file api_compactold.cc
2 * @brief Tests of old compaction API
4 /* Copyright (C) 2009,2010,2011,2012,2013,2015 Olly Betts
5 * Copyright (C) 2010 Richard Boulton
7 * This program is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License as
9 * published by the Free Software Foundation; either version 2 of the
10 * License, or (at your option) any later version.
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301
25 #include "api_compactold.h"
27 #define XAPIAN_DEPRECATED(X) X
32 #include "filetests.h"
34 #include "testsuite.h"
35 #include "testutils.h"
45 make_sparse_db(Xapian::WritableDatabase
&db
, const string
& s
)
47 // Need non-const pointer for strtoul(), but data isn't modified.
48 char * p
= const_cast<char *>(s
.c_str());
51 bool del
= (*p
== '!');
53 Xapian::docid first
= strtoul(p
, &p
, 10);
54 Xapian::docid last
= first
;
56 last
= strtoul(p
+ 1, &p
, 10);
58 if (*p
&& *p
!= ' ') {
59 tout
<< p
- s
.c_str() << endl
;
60 FAIL_TEST("Bad sparse db spec (expected space): " << s
);
63 FAIL_TEST("Bad sparse db spec (first > last): " << s
);
68 db
.delete_document(first
);
71 string id
= str(first
);
73 doc
.add_term("Q" + str(first
));
74 doc
.add_term(string(first
% 7 + 1, char((first
% 26) + 'a')));
75 db
.replace_document(first
, doc
);
77 } while (first
++ < last
);
79 if (*p
== '\0') break;
87 check_sparse_uid_terms(const string
& path
)
89 Xapian::Database
db(path
);
90 Xapian::TermIterator t
;
91 for (t
= db
.allterms_begin("Q"); t
!= db
.allterms_end("Q"); ++t
) {
92 Xapian::docid did
= atoi((*t
).c_str() + 1);
93 Xapian::PostingIterator p
= db
.postlist_begin(*t
);
98 DEFINE_TESTCASE(compactoldnorenumber1
, generated
) {
99 string a
= get_database_path("compactnorenumber1a", make_sparse_db
,
100 "5-7 24 76 987 1023-1027 9999 !9999");
103 Xapian::Database
db(a
);
104 a_uuid
= db
.get_uuid();
106 string b
= get_database_path("compactnorenumber1b", make_sparse_db
,
108 string c
= get_database_path("compactnorenumber1c", make_sparse_db
,
110 string d
= get_database_path("compactnorenumber1d", make_sparse_db
,
111 "3000 999999 !999999");
113 string out
= get_named_writable_database_path("compactnorenumber1out");
117 Xapian::Compactor compact
;
118 compact
.set_renumber(false);
119 compact
.set_destdir(out
);
120 compact
.add_source(a
);
124 check_sparse_uid_terms(out
);
127 TEST(!dir_exists(out
+ "/donor"));
128 Xapian::Database
db(out
);
129 // xapian-compact should change the UUID of the database, but didn't
130 // prior to 1.0.18/1.1.4.
131 string out_uuid
= db
.get_uuid();
132 TEST_NOT_EQUAL(a_uuid
, out_uuid
);
133 TEST_EQUAL(out_uuid
.size(), 36);
134 TEST_NOT_EQUAL(out_uuid
, "00000000-0000-0000-0000-000000000000");
136 // White box test - ensure that the donor database is removed.
137 TEST(!dir_exists(out
+ "/donor"));
142 Xapian::Compactor compact
;
143 compact
.set_renumber(false);
144 compact
.set_destdir(out
);
145 compact
.add_source(a
);
146 compact
.add_source(c
);
149 check_sparse_uid_terms(out
);
151 // Check that xapian-compact is producing a consistent database. Also,
152 // regression test - xapian 1.1.4 set lastdocid to 0 in the output
154 Xapian::Database
outdb(out
);
155 dbcheck(outdb
, 24, 9999);
160 Xapian::Compactor compact
;
161 compact
.set_renumber(false);
162 compact
.set_destdir(out
);
163 compact
.add_source(d
);
164 compact
.add_source(a
);
165 compact
.add_source(c
);
168 check_sparse_uid_terms(out
);
172 Xapian::Compactor compact
;
173 compact
.set_renumber(false);
174 compact
.set_destdir(out
);
175 compact
.add_source(c
);
176 compact
.add_source(a
);
177 compact
.add_source(d
);
180 check_sparse_uid_terms(out
);
185 Xapian::Compactor compact
;
186 compact
.set_renumber(false);
187 compact
.set_destdir(out
);
188 compact
.add_source(a
);
189 compact
.add_source(b
);
190 TEST_EXCEPTION(Xapian::InvalidOperationError
, compact
.compact());
196 Xapian::Compactor compact
;
197 compact
.set_renumber(false);
198 compact
.set_destdir(out
);
199 compact
.add_source(b
);
200 compact
.add_source(a
);
201 TEST_EXCEPTION(Xapian::InvalidOperationError
, compact
.compact());
207 Xapian::Compactor compact
;
208 compact
.set_renumber(false);
209 compact
.set_destdir(out
);
210 compact
.add_source(a
);
211 compact
.add_source(b
);
212 compact
.add_source(d
);
213 TEST_EXCEPTION(Xapian::InvalidOperationError
, compact
.compact());
219 Xapian::Compactor compact
;
220 compact
.set_renumber(false);
221 compact
.set_destdir(out
);
222 compact
.add_source(d
);
223 compact
.add_source(b
);
224 compact
.add_source(a
);
225 TEST_EXCEPTION(Xapian::InvalidOperationError
, compact
.compact());
231 Xapian::Compactor compact
;
232 compact
.set_renumber(false);
233 compact
.set_destdir(out
);
234 compact
.add_source(b
);
235 compact
.add_source(a
);
236 compact
.add_source(d
);
237 TEST_EXCEPTION(Xapian::InvalidOperationError
, compact
.compact());
243 // Test use of compact to merge two databases.
244 DEFINE_TESTCASE(compactoldmerge1
, glass
) {
245 string indbpath
= get_database_path("apitest_simpledata");
246 string outdbpath
= get_named_writable_database_path("compactmerge1out");
249 Xapian::Compactor compact
;
250 compact
.set_destdir(outdbpath
);
251 compact
.add_source(indbpath
);
252 compact
.add_source(indbpath
);
255 Xapian::Database
indb(get_database("apitest_simpledata"));
256 Xapian::Database
outdb(outdbpath
);
258 TEST_EQUAL(indb
.get_doccount() * 2, outdb
.get_doccount());
259 dbcheck(outdb
, outdb
.get_doccount(), outdb
.get_doccount());
265 make_multichunk_db(Xapian::WritableDatabase
&db
, const string
&)
269 Xapian::Document doc
;
272 db
.add_document(doc
);
279 // Test use of compact on a database which has multiple chunks for a term.
280 // This is a regression test for ticket #427
281 DEFINE_TESTCASE(compactoldmultichunks1
, generated
) {
282 string indbpath
= get_database_path("compactmultichunks1in",
283 make_multichunk_db
, "");
284 string outdbpath
= get_named_writable_database_path("compactmultichunks1out");
287 Xapian::Compactor compact
;
288 compact
.set_destdir(outdbpath
);
289 compact
.add_source(indbpath
);
292 Xapian::Database
indb(indbpath
);
293 Xapian::Database
outdb(outdbpath
);
295 TEST_EQUAL(indb
.get_doccount(), outdb
.get_doccount());
296 dbcheck(outdb
, outdb
.get_doccount(), outdb
.get_doccount());
301 // Test compacting from a stub database directory.
302 DEFINE_TESTCASE(compactoldstub1
, glass
) {
303 const char * stubpath
= ".stub/compactstub1";
304 const char * stubpathfile
= ".stub/compactstub1/XAPIANDB";
305 mkdir(".stub", 0755);
306 mkdir(stubpath
, 0755);
307 ofstream
stub(stubpathfile
);
308 TEST(stub
.is_open());
309 stub
<< "auto ../../" << get_database_path("apitest_simpledata") << endl
;
310 stub
<< "auto ../../" << get_database_path("apitest_simpledata2") << endl
;
313 string outdbpath
= get_named_writable_database_path("compactstub1out");
316 Xapian::Compactor compact
;
317 compact
.set_destdir(outdbpath
);
318 compact
.add_source(stubpath
);
321 Xapian::Database
indb(stubpath
);
322 Xapian::Database
outdb(outdbpath
);
324 TEST_EQUAL(indb
.get_doccount(), outdb
.get_doccount());
325 dbcheck(outdb
, outdb
.get_doccount(), outdb
.get_doccount());
330 // Test compacting from a stub database file.
331 DEFINE_TESTCASE(compactoldstub2
, glass
) {
332 const char * stubpath
= ".stub/compactstub2";
333 mkdir(".stub", 0755);
334 ofstream
stub(stubpath
);
335 TEST(stub
.is_open());
336 stub
<< "auto ../" << get_database_path("apitest_simpledata") << endl
;
337 stub
<< "auto ../" << get_database_path("apitest_simpledata2") << endl
;
340 string outdbpath
= get_named_writable_database_path("compactstub2out");
343 Xapian::Compactor compact
;
344 compact
.set_destdir(outdbpath
);
345 compact
.add_source(stubpath
);
348 Xapian::Database
indb(stubpath
);
349 Xapian::Database
outdb(outdbpath
);
351 TEST_EQUAL(indb
.get_doccount(), outdb
.get_doccount());
352 dbcheck(outdb
, outdb
.get_doccount(), outdb
.get_doccount());
357 // Test compacting a stub database file to itself.
358 DEFINE_TESTCASE(compactoldstub3
, glass
) {
359 const char * stubpath
= ".stub/compactstub3";
360 mkdir(".stub", 0755);
361 ofstream
stub(stubpath
);
362 TEST(stub
.is_open());
363 stub
<< "auto ../" << get_database_path("apitest_simpledata") << endl
;
364 stub
<< "auto ../" << get_database_path("apitest_simpledata2") << endl
;
367 Xapian::doccount in_docs
;
369 Xapian::Database
indb(stubpath
);
370 in_docs
= indb
.get_doccount();
373 Xapian::Compactor compact
;
374 compact
.set_destdir(stubpath
);
375 compact
.add_source(stubpath
);
378 Xapian::Database
outdb(stubpath
);
380 TEST_EQUAL(in_docs
, outdb
.get_doccount());
381 dbcheck(outdb
, outdb
.get_doccount(), outdb
.get_doccount());
386 // Test compacting a stub database directory to itself.
387 DEFINE_TESTCASE(compactoldstub4
, glass
) {
388 const char * stubpath
= ".stub/compactstub4";
389 const char * stubpathfile
= ".stub/compactstub4/XAPIANDB";
390 mkdir(".stub", 0755);
391 mkdir(stubpath
, 0755);
392 ofstream
stub(stubpathfile
);
393 TEST(stub
.is_open());
394 stub
<< "auto ../../" << get_database_path("apitest_simpledata") << endl
;
395 stub
<< "auto ../../" << get_database_path("apitest_simpledata2") << endl
;
398 Xapian::doccount in_docs
;
400 Xapian::Database
indb(stubpath
);
401 in_docs
= indb
.get_doccount();
404 Xapian::Compactor compact
;
405 compact
.set_destdir(stubpath
);
406 compact
.add_source(stubpath
);
409 Xapian::Database
outdb(stubpath
);
411 TEST_EQUAL(in_docs
, outdb
.get_doccount());
412 dbcheck(outdb
, outdb
.get_doccount(), outdb
.get_doccount());
418 make_all_tables(Xapian::WritableDatabase
&db
, const string
&)
420 Xapian::Document doc
;
422 db
.add_document(doc
);
423 db
.add_spelling("foo");
424 db
.add_synonym("bar", "pub");
425 db
.add_synonym("foobar", "foo");
431 make_missing_tables(Xapian::WritableDatabase
&db
, const string
&)
433 Xapian::Document doc
;
435 db
.add_document(doc
);
440 DEFINE_TESTCASE(compactoldmissingtables1
, generated
) {
441 string a
= get_database_path("compactmissingtables1a",
443 string b
= get_database_path("compactmissingtables1b",
444 make_missing_tables
);
446 string out
= get_named_writable_database_path("compactmissingtables1out");
449 Xapian::Compactor compact
;
450 compact
.set_destdir(out
);
451 compact
.add_source(a
);
452 compact
.add_source(b
);
456 Xapian::Database
db(out
);
457 TEST_NOT_EQUAL(db
.spellings_begin(), db
.spellings_end());
458 TEST_NOT_EQUAL(db
.synonym_keys_begin(), db
.synonym_keys_end());
459 // FIXME: arrange for input b to not have a termlist table.
460 // TEST_EXCEPTION(Xapian::FeatureUnavailableError, db.termlist_begin(1));
467 make_all_tables2(Xapian::WritableDatabase
&db
, const string
&)
469 Xapian::Document doc
;
471 db
.add_document(doc
);
472 db
.add_spelling("bar");
473 db
.add_synonym("bar", "baa");
474 db
.add_synonym("barfoo", "barbar");
475 db
.add_synonym("foofoo", "barfoo");
480 /// Adds coverage for merging synonym table.
481 DEFINE_TESTCASE(compactoldmergesynonym1
, generated
) {
482 string a
= get_database_path("compactmergesynonym1a",
484 string b
= get_database_path("compactmergesynonym1b",
487 string out
= get_named_writable_database_path("compactmergesynonym1out");
490 Xapian::Compactor compact
;
491 compact
.set_destdir(out
);
492 compact
.add_source(a
);
493 compact
.add_source(b
);
497 Xapian::Database
db(out
);
499 Xapian::TermIterator i
= db
.spellings_begin();
500 TEST_NOT_EQUAL(i
, db
.spellings_end());
501 TEST_EQUAL(*i
, "bar");
503 TEST_NOT_EQUAL(i
, db
.spellings_end());
504 TEST_EQUAL(*i
, "foo");
506 TEST_EQUAL(i
, db
.spellings_end());
508 i
= db
.synonym_keys_begin();
509 TEST_NOT_EQUAL(i
, db
.synonym_keys_end());
510 TEST_EQUAL(*i
, "bar");
512 TEST_NOT_EQUAL(i
, db
.synonym_keys_end());
513 TEST_EQUAL(*i
, "barfoo");
515 TEST_NOT_EQUAL(i
, db
.synonym_keys_end());
516 TEST_EQUAL(*i
, "foobar");
518 TEST_NOT_EQUAL(i
, db
.synonym_keys_end());
519 TEST_EQUAL(*i
, "foofoo");
521 TEST_EQUAL(i
, db
.synonym_keys_end());
527 DEFINE_TESTCASE(compactoldempty1
, glass
) {
528 string empty_dbpath
= get_database_path(string());
529 string outdbpath
= get_named_writable_database_path("compactempty1out");
533 // Compacting an empty database tried to divide by zero in 1.3.0.
534 Xapian::Compactor compact
;
535 compact
.set_destdir(outdbpath
);
536 compact
.add_source(empty_dbpath
);
539 Xapian::Database
outdb(outdbpath
);
540 TEST_EQUAL(outdb
.get_doccount(), 0);
541 dbcheck(outdb
, 0, 0);
545 // Check compacting two empty databases together.
546 Xapian::Compactor compact
;
547 compact
.set_destdir(outdbpath
);
548 compact
.add_source(empty_dbpath
);
549 compact
.add_source(empty_dbpath
);
552 Xapian::Database
outdb(outdbpath
);
553 TEST_EQUAL(outdb
.get_doccount(), 0);
554 dbcheck(outdb
, 0, 0);
560 DEFINE_TESTCASE(compactoldmultipass1
, glass
) {
561 string outdbpath
= get_named_writable_database_path("compactmultipass1");
564 string a
= get_database_path("compactnorenumber1a", make_sparse_db
,
565 "5-7 24 76 987 1023-1027 9999 !9999");
566 string b
= get_database_path("compactnorenumber1b", make_sparse_db
,
568 string c
= get_database_path("compactnorenumber1c", make_sparse_db
,
570 string d
= get_database_path("compactnorenumber1d", make_sparse_db
,
571 "3000 999999 !999999");
573 Xapian::Compactor compact
;
574 compact
.set_destdir(outdbpath
);
575 compact
.add_source(a
);
576 compact
.add_source(b
);
577 compact
.add_source(c
);
578 compact
.add_source(d
);
579 compact
.set_multipass(true);
582 Xapian::Database
outdb(outdbpath
);
583 dbcheck(outdb
, 29, 1041);