44 if (find_if(line.begin(), line.end(),
C_isnotspace) == line.end())
56 while (file != end || (
input.is_open() && !
input.eof())) {
57 if (
input.eof()) next_file();
65 string value0(
"X\0\0\0 \1\t" 66 "\x00\x01\x02\x03\x04\x05\x06\x07\x08\x09\x0a\x0b\x0c\x0d\x0e\x0f" 67 "\x10\x11\x12\x13\x14\x15\x16\x17\x18\x19\x1a\x1b\x1c\x1d\x1e\x1f" 68 "\x20\x21\x22\x23\x24\x25\x26\x27\x28\x29\x2a\x2b\x2c\x2d\x2e\x2f" 69 "\x30\x31\x32\x33\x34\x35\x36\x37\x38\x39\x3a\x3b\x3c\x3d\x3e\x3f" 70 "\x40\x41\x42\x43\x44\x45\x46\x47\x48\x49\x4a\x4b\x4c\x4d\x4e\x4f" 71 "\x50\x51\x52\x53\x54\x55\x56\x57\x58\x59\x5a\x5b\x5c\x5d\x5e\x5f" 72 "\x60\x61\x62\x63\x64\x65\x66\x67\x68\x69\x6a\x6b\x6c\x6d\x6e\x6f" 73 "\x70\x71\x72\x73\x74\x75\x76\x77\x78\x79\x7a\x7b\x7c\x7d\x7e\x7f" 74 "\x80\x81\x82\x83\x84\x85\x86\x87\x88\x89\x8a\x8b\x8c\x8d\x8e\x8f" 75 "\x90\x91\x92\x93\x94\x95\x96\x97\x98\x99\x9a\x9b\x9c\x9d\x9e\x9f" 76 "\xa0\xa1\xa2\xa3\xa4\xa5\xa6\xa7\xa8\xa9\xaa\xab\xac\xad\xae\xaf" 77 "\xb0\xb1\xb2\xb3\xb4\xb5\xb6\xb7\xb8\xb9\xba\xbb\xbc\xbd\xbe\xbf" 78 "\xc0\xc1\xc2\xc3\xc4\xc5\xc6\xc7\xc8\xc9\xca\xcb\xcc\xcd\xce\xcf" 79 "\xd0\xd1\xd2\xd3\xd4\xd5\xd6\xd7\xd8\xd9\xda\xdb\xdc\xdd\xde\xdf" 80 "\xe0\xe1\xe2\xe3\xe4\xe5\xe6\xe7\xe8\xe9\xea\xeb\xec\xed\xee\xef" 81 "\xf0\xf1\xf2\xf3\xf4\xf5\xf6\xf7\xf8\xf9\xfa\xfb\xfc\xfd\xfe\xff",
83 if (para.size() > 2) value0[0] = para[2];
100 string::const_iterator word_end = para.begin();
102 const string::const_iterator para_end = para.end();
103 while (word_end != para_end) {
104 string::const_iterator word_start;
106 word_end = find_if(word_start, para_end,
C_isspace);
120 for (string::const_iterator i = term.begin(); i != term.end(); ++i) {
124 else if (ch ==
'\\') {
126 if (i != term.end()) {
128 case '\\': ch =
'\\';
break;
129 case '0': ch =
'\0';
break;
130 case 'n': ch =
'\n';
break;
131 case 'r': ch =
'\r';
break;
132 case 't': ch =
'\t';
break;
135 if (
size_t(i - term.begin()) >= term.size() - 2) {
139 string::const_iterator j = i;
160 if (
input.is_open()) {
167 while (file != end && (*file).empty()) {
170 if (file == end)
return;
173 if (!datadir.empty()) {
175 bool need_slash =
true;
177 if (filename.back() == dir_sep) {
182 if (need_slash) filename +=
'/';
187 input.open(filename.c_str());
189 if (!
input.is_open()) {
190 string msg =
"Can't read file '";
192 msg +=
"' for indexing (";
Xapian::docid add_document(const Xapian::Document &document)
Add a new document to the database.
void add_value(Xapian::valueno slot, const std::string &value)
Add a new value.
Class representing a stemming algorithm.
static string munge_term(const string &term)
Convert errno value to std::string, thread-safe if possible.
std::string sortable_serialise(double value)
Convert a floating point number to a string, preserving sort order.
static Xapian::Stem stemmer
static string get_paragraph(istream &input)
Read a paragraph from stream input.
This class provides read/write access to a database.
void errno_to_string(int e, string &s)
void add_posting(const std::string &tname, Xapian::termpos tpos, Xapian::termcount wdfinc=1)
Add an occurrence of a term at a particular position.
unsigned valueno
The number for a value slot in a document.
char hex_decode(char ch1, char ch2)
Decode a pair of ASCII hex digits.
unsigned XAPIAN_TERMPOS_BASE_TYPE termpos
A term position within a document or query.
void index_to(Xapian::WritableDatabase &db)
Various handy helpers which std::string really should provide.
utility functions for indexing testcase data
void set_data(const std::string &data)
Set data stored in the document.
bool C_isnotspace(char ch)
A handle representing a document in a Xapian database.