1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458
|
/** @file dbcheck.cc
* @brief Check the consistency of a database or table.
*/
/* Copyright 1999,2000,2001 BrightStation PLC
* Copyright 2002,2003,2004,2005,2006,2007,2008,2009,2010,2011,2012,2013,2014,2015,2016 Olly Betts
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License as
* published by the Free Software Foundation; either version 2 of the
* License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301
* USA
*/
#include <config.h>
#include "xapian/database.h"
#include "xapian/constants.h"
#include "xapian/error.h"
#ifdef XAPIAN_HAS_GLASS_BACKEND
#include "glass/glass_changes.h"
#include "glass/glass_database.h"
#include "glass/glass_dbcheck.h"
#include "glass/glass_version.h"
#endif
#ifdef XAPIAN_HAS_CHERT_BACKEND
#include "chert/chert_database.h"
#include "chert/chert_dbcheck.h"
#include "chert/chert_types.h"
#include "chert/chert_version.h"
#endif
#include "filetests.h"
#include "omassert.h"
#include "posixy_wrapper.h"
#include "stringutils.h"
#include <ostream>
#include <stdexcept>
using namespace std;
#ifdef XAPIAN_HAS_GLASS_BACKEND
// Tables to check for a glass database, listed in the order in which the
// checking loops in this file visit them. Note: it's important to check
// termlist before postlist so that we can cross-check the document lengths.
//
// Each name is stored inline in a fixed-size buffer: the longest names below
// are 8 characters, so char[9] leaves room for the terminating NUL.
static const struct { char name[9]; } glass_tables[] = {
{ "docdata" },
{ "termlist" },
{ "postlist" },
{ "position" },
{ "spelling" },
{ "synonym" }
};
#endif
/** Test whether @a path looks like a single-file glass database.
 *
 *  @param sb      Result of stat() on @a path.
 *  @param path    Path of the file to examine.
 *  @param fd_ptr  If non-NULL and the file is recognised, receives an open
 *                 read-only descriptor which has been seeked back to offset
 *                 0 (the caller then owns it).  If NULL, the file is closed
 *                 again before returning.
 *
 *  @return true if the file starts with the glass magic string; false
 *          otherwise (always false when glass support isn't compiled in).
 */
static bool
check_if_single_file_db(const struct stat & sb, const string & path,
                        int * fd_ptr = NULL)
{
#ifdef XAPIAN_HAS_GLASS_BACKEND
    // Cheap pre-filter using the stat data: a candidate must be a regular,
    // non-empty file whose size is a multiple of 2048 bytes.
    const bool plausible = S_ISREG(sb.st_mode) &&
                           sb.st_size != 0 &&
                           sb.st_size % 2048 == 0;
    if (!plausible) return false;

    const int handle = posixy_open(path.c_str(), O_RDONLY|O_BINARY);
    if (handle == -1) return false;

    // Peek at the start of the file to see if it has the glass magic.
    // FIXME: Don't duplicate magic check here...
    // NOTE(review): if io_read() can throw, handle would leak here - confirm
    // against its declaration.
    char header[14];
    bool is_glass = (io_read(handle, header, 14) == 14);
    if (is_glass && fd_ptr) {
        // The caller wants to read from the start, so rewind.
        is_glass = (lseek(handle, 0, SEEK_SET) == 0);
    }
    if (is_glass) {
        is_glass = (memcmp(header, "\x0f\x0dXapian Glass", 14) == 0);
    }

    if (is_glass && fd_ptr) {
        // Hand ownership of the descriptor to the caller.
        *fd_ptr = handle;
    } else {
        ::close(handle);
    }
    return is_glass;
#else
    (void)sb;
    (void)path;
    (void)fd_ptr;
    return false;
#endif
}
// FIXME: We don't currently cross-check wdf between postlist and termlist.
// It's hard to see how to do so efficiently. We do cross-check doclens, but
// that "only" requires (4 * last_docid()) bytes.
#if defined XAPIAN_HAS_CHERT_BACKEND || defined XAPIAN_HAS_GLASS_BACKEND
/** Pre-allocate space in @a doclens for one entry per possible docid.
 *
 *  If the allocation would need 1GB or more, or if it fails, @a doclens is
 *  left without the reservation and a message saying the document length
 *  cross-check is being skipped is written to @a out (when non-NULL).
 *
 *  @param doclens     Vector to reserve space in.
 *  @param last_docid  Highest docid; space for last_docid + 1 entries is
 *                     requested.
 *  @param out         Stream for messages, or NULL for no output.
 */
static void
reserve_doclens(vector<Xapian::termcount>& doclens, Xapian::docid last_docid,
                ostream * out)
{
    // All three failure paths report in the same way.
    auto report = [out](const char * message) {
        if (out)
            *out << message << endl;
    };

    // Number of entries at which the vector's storage reaches 1GB.
    const auto one_gb_of_entries = 0x40000000ul / sizeof(Xapian::termcount);
    if (last_docid >= one_gb_of_entries) {
        // The memory block needed by the vector would be >= 1GB.
        report("Cross-checking document lengths between the postlist and "
               "termlist tables would use more than 1GB of memory, so "
               "skipping that check");
        return;
    }

    try {
        doclens.reserve(last_docid + 1);
    } catch (const std::bad_alloc &) {
        // Failed to allocate the required memory.
        report("Couldn't allocate enough memory for cross-checking document "
               "lengths between the postlist and termlist tables, so "
               "skipping that check");
    } catch (const std::length_error &) {
        // There are too many elements for the vector to handle!
        report("Couldn't allocate enough elements for cross-checking document "
               "lengths between the postlist and termlist tables, so "
               "skipping that check");
    }
}
#endif
static size_t
check_db_dir(const string & path, int opts, std::ostream *out)
{
struct stat sb;
if (stat((path + "/iamchert").c_str(), &sb) == 0) {
#ifndef XAPIAN_HAS_CHERT_BACKEND
(void)opts;
(void)out;
throw Xapian::FeatureUnavailableError("Chert database support isn't enabled");
#else
// Check a whole chert database directory.
vector<Xapian::termcount> doclens;
size_t errors = 0;
// If we can't read the doccount or last docid, set them to their
// maximum values to suppress errors.
Xapian::doccount doccount = Xapian::doccount(-1);
Xapian::docid db_last_docid = CHERT_MAX_DOCID;
chert_revision_number_t rev = 0;
chert_revision_number_t * rev_ptr = &rev;
try {
// Open at the lower level so we can get the revision number.
ChertDatabase db(path);
doccount = db.get_doccount();
db_last_docid = db.get_lastdocid();
reserve_doclens(doclens, db_last_docid, out);
rev = db.get_revision_number();
} catch (const Xapian::Error & e) {
// Ignore so we can check a database too broken to open.
if (out)
*out << "Database couldn't be opened for reading: "
<< e.get_description()
<< "\nContinuing check anyway" << endl;
++errors;
}
size_t pre_table_check_errors = errors;
// Check all the btrees.
//
// Note: it's important to check "termlist" before "postlist" so
// that we can cross-check the document lengths; also we check
// "record" first as that's the last committed, so has the most
// reliable rootblock revision in DBCHECK_FIX mode.
static const struct { char name[9]; } tables[] = {
{ "record" },
{ "termlist" },
{ "postlist" },
{ "position" },
{ "spelling" },
{ "synonym" }
};
for (auto t : tables) {
const char * name = t.name;
string table(path);
table += '/';
table += name;
if (out)
*out << name << ":\n";
if (strcmp(name, "record") != 0 && strcmp(name, "postlist") != 0) {
// Other tables are created lazily, so may not exist.
if (!file_exists(table + ".DB")) {
if (out) {
if (strcmp(name, "termlist") == 0) {
*out << "Not present.\n";
} else {
*out << "Lazily created, and not yet used.\n";
}
*out << endl;
}
continue;
}
}
errors += check_chert_table(name, table, rev_ptr, opts, doclens,
doccount, db_last_docid, out);
}
if (errors == pre_table_check_errors && (opts & Xapian::DBCHECK_FIX)) {
// Check the version file is OK and if not, recreate it.
ChertVersion iam(path);
try {
iam.read_and_check();
} catch (const Xapian::DatabaseError &) {
iam.create();
}
}
return errors;
#endif
}
if (stat((path + "/iamglass").c_str(), &sb) == 0) {
#ifndef XAPIAN_HAS_GLASS_BACKEND
(void)opts;
(void)out;
throw Xapian::FeatureUnavailableError("Glass database support isn't enabled");
#else
// Check a whole glass database directory.
vector<Xapian::termcount> doclens;
size_t errors = 0;
try {
// Check if the database can actually be opened.
Xapian::Database db(path);
} catch (const Xapian::Error & e) {
// Continue - we can still usefully look at how it is broken.
if (out)
*out << "Database couldn't be opened for reading: "
<< e.get_description()
<< "\nContinuing check anyway" << endl;
++errors;
}
GlassVersion version_file(path);
version_file.read();
for (glass_revision_number_t r = version_file.get_revision(); r != 0; --r) {
string changes_file = path;
changes_file += "/changes";
changes_file += str(r);
if (file_exists(changes_file))
GlassChanges::check(changes_file);
}
Xapian::docid doccount = version_file.get_doccount();
Xapian::docid db_last_docid = version_file.get_last_docid();
if (db_last_docid < doccount) {
if (out)
*out << "last_docid = " << db_last_docid << " < doccount = "
<< doccount << endl;
++errors;
}
reserve_doclens(doclens, db_last_docid, out);
// Check all the tables.
for (auto t : glass_tables) {
errors += check_glass_table(t.name, path, version_file, opts,
doclens, out);
}
return errors;
#endif
}
if (stat((path + "/iamflint").c_str(), &sb) == 0) {
// Flint is no longer supported as of Xapian 1.3.0.
throw Xapian::FeatureUnavailableError("Flint database support was removed in Xapian 1.3.0");
}
if (stat((path + "/iambrass").c_str(), &sb) == 0) {
// Brass was renamed to glass as of Xapian 1.3.2.
throw Xapian::FeatureUnavailableError("Brass database support was removed in Xapian 1.3.2");
}
if (stat((path + "/record_DB").c_str(), &sb) == 0) {
// Quartz is no longer supported as of Xapian 1.1.0.
throw Xapian::FeatureUnavailableError("Quartz database support was removed in Xapian 1.1.0");
}
throw Xapian::DatabaseError("Directory does not contain a Xapian database");
}
/** Check a single B-tree table given the path of (or a prefix of) its file.
 *
 *  @a path may name the table with or without a trailing ".", ".DB" (chert)
 *  or ".glass" (glass) - e.g. "foo", "foo.", "foo.DB" and "foo.glass" are
 *  all accepted.  When no extension is given, the backend is deduced from
 *  which of "<path>.DB" and "<path>.glass" exists.
 *
 *  @param path  Path identifying the table.
 *  @param opts  Bitwise-or of Xapian::DBCHECK_* flags; passed through to the
 *               per-table checker.
 *  @param out   Stream to write the report to, or NULL for no output.
 *
 *  @return The number of errors the table checker reports.
 *
 *  @exception Xapian::DatabaseError  No matching table file exists.
 *  @exception Xapian::FeatureUnavailableError  The table belongs to a
 *             backend which isn't enabled or has been removed.
 */
static size_t
check_if_db_table(const string & path, int opts, std::ostream *out)
{
    // Just check a single Btree.  If it ends with ".", ".DB", or ".glass",
    // trim that so the user can do xapian-check on "foo", "foo.", "foo.DB",
    // "foo.glass", etc.
    enum { UNKNOWN, CHERT, GLASS } backend = UNKNOWN;
    string filename = path;
    if (endswith(filename, '.')) {
        filename.resize(filename.size() - 1);
    } else if (endswith(filename, ".DB")) {
        filename.resize(filename.size() - CONST_STRLEN(".DB"));
        backend = CHERT;
    } else if (endswith(filename, ".glass")) {
        filename.resize(filename.size() - CONST_STRLEN(".glass"));
        backend = GLASS;
    }

    struct stat sb;
    if (backend == UNKNOWN) {
        if (stat((filename + ".DB").c_str(), &sb) == 0) {
            // It could also be flint or brass, but we check for those below.
            backend = CHERT;
        } else if (stat((filename + ".glass").c_str(), &sb) == 0) {
            backend = GLASS;
        } else {
            throw Xapian::DatabaseError("File is not a Xapian database or database table");
        }
    }

    // Split filename into the directory part (up to and including the last
    // directory separator) and the table's leaf name.
    //
    // On platforms where '\\' is also a separator we need the LAST of either
    // character.  Searching for '\\' only at or before the last '/' (as was
    // done previously) split "dir\\table" and "a\\b/c" in the wrong place and
    // lost the directory part entirely for paths using only '/'.
#if defined __WIN32__ || defined __OS2__
    size_t p = filename.find_last_of("/\\");
#else
    size_t p = filename.find_last_of('/');
#endif
    if (p == string::npos) p = 0; else ++p;

    string dir(filename, 0, p);
    if (dir.empty()) {
        // The table was named without a directory part, so it's in the
        // current directory.  Say so explicitly: an empty dir would make
        // dir + "/iamflint" below name a file in the filesystem root, and
        // the glass helpers are given a separator-less directory path
        // elsewhere in this file, so they must append the separator too.
        dir = ".";
    }

    // Table names are lower case, so fold the leaf name to match.
    string tablename;
    tablename.reserve(filename.size() - p);
    while (p != filename.size()) {
        tablename += C_tolower(filename[p++]);
    }

#if defined XAPIAN_HAS_CHERT_BACKEND || defined XAPIAN_HAS_GLASS_BACKEND
    // Left empty: there's no other table to cross-check document lengths
    // against when checking a single table.
    vector<Xapian::termcount> doclens;
#else
    (void)opts;
    (void)out;
#endif

    if (backend == GLASS) {
#ifndef XAPIAN_HAS_GLASS_BACKEND
        throw Xapian::FeatureUnavailableError("Glass database support isn't enabled");
#else
        GlassVersion version_file(dir);
        version_file.read();
        return check_glass_table(tablename.c_str(), dir, version_file, opts,
                                 doclens, out);
#endif
    }

    Assert(backend == CHERT);

    // Flint and brass also used the extension ".DB", so check that we
    // haven't been passed a single table in a flint or brass database.
    if (stat((dir + "/iamflint").c_str(), &sb) == 0) {
        // Flint is no longer supported as of Xapian 1.3.0.
        throw Xapian::FeatureUnavailableError("Flint database support was removed in Xapian 1.3.0");
    }
    if (stat((dir + "/iambrass").c_str(), &sb) == 0) {
        // Brass was renamed to glass as of Xapian 1.3.2.
        throw Xapian::FeatureUnavailableError("Brass database support was removed in Xapian 1.3.2");
    }
#ifndef XAPIAN_HAS_CHERT_BACKEND
    throw Xapian::FeatureUnavailableError("Chert database support isn't enabled");
#else
    // Set the doccount and the last docid to their maximum values to suppress
    // errors.
    return check_chert_table(tablename.c_str(), filename, NULL, opts, doclens,
                             Xapian::doccount(-1), CHERT_MAX_DOCID, out);
#endif
}
/** Check a single-file glass database which is already open on @a fd.
 *
 *  Closes the fd (via GlassVersion doing so in its destructor), or directly
 *  if glass support isn't compiled in.
 *
 *  @param fd    Open file descriptor for the database.
 *  @param opts  Bitwise-or of Xapian::DBCHECK_* flags; passed through to the
 *               per-table checker.
 *  @param out   Stream to write the report to, or NULL for no output.
 *
 *  @return The number of errors found.
 *
 *  @exception Xapian::FeatureUnavailableError  Glass support isn't enabled.
 */
static size_t
check_db_fd(int fd, int opts, std::ostream *out)
{
#ifdef XAPIAN_HAS_GLASS_BACKEND
    // Check a single-file glass database.
    GlassVersion version_file(fd);
    version_file.read();

    size_t n_errors = 0;

    // The last docid can't be lower than the number of documents.
    Xapian::docid doc_total = version_file.get_doccount();
    Xapian::docid highest_docid = version_file.get_last_docid();
    if (highest_docid < doc_total) {
        if (out) {
            *out << "last_docid = " << highest_docid << " < doccount = "
                 << doc_total << endl;
        }
        ++n_errors;
    }

    vector<Xapian::termcount> lengths;
    reserve_doclens(lengths, highest_docid, out);

    // Check all the tables.
    const size_t n_tables = sizeof(glass_tables) / sizeof(glass_tables[0]);
    for (size_t i = 0; i != n_tables; ++i) {
        n_errors += check_glass_table(glass_tables[i].name, fd,
                                      version_file.get_offset(),
                                      version_file, opts, lengths, out);
    }
    return n_errors;
#else
    (void)opts;
    (void)out;
    // There's no GlassVersion object to close the fd for us here.
    ::close(fd);
    throw Xapian::FeatureUnavailableError("Glass database support isn't enabled");
#endif
}
/** Check the regular file @a path.
 *
 *  The file is checked as a single-file database if it is recognised as
 *  one, and otherwise as an individual table.
 *
 *  @param path  Path of the file.
 *  @param sb    Result of stat() on @a path.
 *  @param opts  Bitwise-or of Xapian::DBCHECK_* flags.
 *  @param out   Stream to write the report to, or NULL for no output.
 *
 *  @return The number of errors found.
 */
static size_t
check_db_file(const string & path, const struct stat & sb, int opts, std::ostream *out)
{
    // Only meaningful if the single-file test below succeeds, in which case
    // it holds an open descriptor that check_db_fd() takes over.
    int fd = -1;
    const bool single_file = check_if_single_file_db(sb, path, &fd);
    if (!single_file) {
        return check_if_db_table(path, opts, out);
    }
    return check_db_fd(fd, opts, out);
}
namespace Xapian {

/** Check a database or table, dispatching on what was specified.
 *
 *  @param path_ptr  Path to check, or NULL to check the single-file
 *                   database open on @a fd instead.
 *  @param fd        File descriptor; only used when @a path_ptr is NULL.
 *  @param opts      Bitwise-or of Xapian::DBCHECK_* flags.
 *  @param out       Stream to write the report to, or NULL for no output.
 *
 *  @return The number of errors found.
 *
 *  @exception Xapian::DatabaseError  @a path exists but is neither a
 *             regular file nor a directory.
 */
size_t
Database::check_(const string * path_ptr, int fd, int opts, std::ostream *out)
{
    if (out == NULL) {
        // If we have nowhere to write output, then disable all the options
        // which only affect what we output.
        opts &= Xapian::DBCHECK_FIX;
    }

    if (!path_ptr) {
        return check_db_fd(fd, opts, out);
    }

    const string & path = *path_ptr;
    struct stat sb;
    if (stat(path.c_str(), &sb) != 0) {
        // Nothing exists at exactly this path, but it may name a table with
        // the extension omitted.
        return check_if_db_table(path, opts, out);
    }

    if (S_ISDIR(sb.st_mode)) {
        return check_db_dir(path, opts, out);
    }

    if (S_ISREG(sb.st_mode)) {
        return check_db_file(path, sb, opts, out);
    }

    throw Xapian::DatabaseError("Not a regular file or directory");
}

}
|