sourcedoc/html/api__snippets_8cc_source.html

 /* Copyright 2012 Mihai Bivol
  * Copyright 2015,2016,2017,2019,2020 Olly Betts
  *
  * This program is free software; you can redistribute it and/or
  * modify it under the terms of the GNU General Public License as
  * published by the Free Software Foundation; either version 2 of the
  * License, or (at your option) any later version.
  *
  * This program is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  * GNU General Public License for more details.
  *
  * You should have received a copy of the GNU General Public License
  * along with this program; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301
  * USA
  */

 #include <config.h>

 #include "api_snippets.h"

 #include <fstream>
 #include <string>

 #include <xapian.h>

 #include "apitest.h"
 #include "testsuite.h"
 #include "testutils.h"

 using namespace std;

 /// One entry in a table of snippet checks.
 struct snippet_testcase {
     /// Sample text passed to MSet::snippet().
     const char* input;

     /// Value passed as the length argument of MSet::snippet().
     size_t len;

     /// Snippet text the call is expected to return.
     const char* expect;
 };

 /// Test snippets without stemming.
 DEFINE_TESTCASE(snippet1, backend) {
     Xapian::Enquire enquire(get_database("apitest_simpledata"));
     // OR together the two terms which should get highlighted.
     const Xapian::Query query(Xapian::Query::OP_OR,
                               Xapian::Query("rubbish"),
                               Xapian::Query("mention"));
     enquire.set_query(query);
     // Zero results are requested: each check below supplies its own text.
     Xapian::MSet mset = enquire.get_mset(0, 0);

     static const snippet_testcase testcases[] = {
         // Length is large enough for the whole sample: highlighting only.
         { "Rubbish and junk", 20, "<b>Rubbish</b> and junk" },
         { "Project R.U.B.B.I.S.H. greenlit", 31, "Project <b>R.U.B.B.I.S.H.</b> greenlit" },
         { "What a load of rubbish", 100, "What a load of <b>rubbish</b>" },
         { "Mention rubbish", 100, "<b>Mention</b> <b>rubbish</b>" },
         { "A mention of rubbish", 100, "A <b>mention</b> of <b>rubbish</b>" },
         { "Rubbish mention of rubbish", 100, "<b>Rubbish</b> <b>mention</b> of <b>rubbish</b>" },

         // Length is shorter than the sample: a part has to be selected.
         { "Rubbish and junk", 12, "<b>Rubbish</b> and..." },
         { "Project R.U.B.B.I.S.H. greenlit", 14, "...<b>R.U.B.B.I.S.H.</b>..." },
         { "What a load of rubbish", 12, "...of <b>rubbish</b>" },
         { "What a load of rubbish", 8, "...<b>rubbish</b>" },
         { "Rubbish mention where the start is better than the rubbish ending", 18, "<b>Rubbish</b> <b>mention</b>..." },

         // "Interesting" words should be preferred as context.
         { "And of the rubbish document to this", 18, "...<b>rubbish</b> document..." },
         { "And if they document rubbish to be this", 18, "...document <b>rubbish</b>..." },
     };

     for (const snippet_testcase& tc : testcases) {
         TEST_STRINGS_EQUAL(mset.snippet(tc.input, tc.len), tc.expect);
     }
 }

 /// Test snippets with an English stemmer and a stemmed ("Z"-prefixed) term.
 DEFINE_TESTCASE(snippetstem1, backend) {
     Xapian::Enquire enquire(get_database("apitest_simpledata"));
     const Xapian::Query query(Xapian::Query::OP_OR,
                               Xapian::Query("rubbish"),
                               Xapian::Query("Zexampl"));
     enquire.set_query(query);
     Xapian::MSet mset = enquire.get_mset(0, 0);

     // The database doesn't contain the term Zexampl, but the highlighter
     // should cope with it all the same.
     static const snippet_testcase testcases[] = {
         // The query has "rubbish" unstemmed, but "example" stemmed.
         { "You rubbished my ideas", 24, "You rubbished my ideas" },
         { "Rubbished all my examples", 20, "...all my <b>examples</b>" },
         { "Examples of text", 20, "<b>Examples</b> of text" },
     };

     const Xapian::Stem stem("en");
     for (const snippet_testcase& tc : testcases) {
         TEST_STRINGS_EQUAL(mset.snippet(tc.input, tc.len, stem), tc.expect);
     }
 }

 /// Test snippets for a phrase query: only the whole phrase is highlighted.
 DEFINE_TESTCASE(snippetphrase1, backend) {
     Xapian::Enquire enquire(get_database("apitest_simpledata"));
     Xapian::Query phrase(Xapian::Query::OP_PHRASE,
                          Xapian::Query("rubbish"),
                          Xapian::Query("mention"));
     // Regression test: the highlighting code used to crash when a phrase
     // was followed by a sibling query.
     enquire.set_query(phrase & ~Xapian::Query("banana"));
     Xapian::MSet mset = enquire.get_mset(0, 0);

     static const snippet_testcase testcases[] = {
         { "A mention of rubbish", 18, "...mention of rubbish" },
         { "This is a rubbish mention", 20, "...is a <b>rubbish mention</b>" },
         { "Mention of a rubbish mention of rubbish", 45, "Mention of a <b>rubbish mention</b> of rubbish" },
         { "Mention of a rubbish mention of rubbish", 18, "...<b>rubbish mention</b> of..." },
         { "rubbish rubbish mention mention", 45, "rubbish <b>rubbish mention</b> mention" },
         { "rubbish mention rubbish mention", 45, "<b>rubbish mention</b> <b>rubbish mention</b>" },
     };

     const Xapian::Stem stem("en");
     for (const snippet_testcase& tc : testcases) {
         TEST_STRINGS_EQUAL(mset.snippet(tc.input, tc.len, stem), tc.expect);
     }
 }

 /** Index a test data file into @a db using Xapian::TermGenerator.
  *
  *  The file read is `<srcdir>/testdata/<source>.txt`.  Consecutive lines
  *  which contain a character for which C_isnotspace() is true form one
  *  document: each such line is indexed (with an "en" stemmer set on the
  *  term generator) and the lines, joined by single spaces, become the
  *  document data.  Any other line, or the end of the file, ends the current
  *  document.
  *
  *  @param db      Database the documents are added to.
  *  @param source  Base name of the data file (no directory, no extension).
  *
  *  Fails the current testcase if the file can't be opened or if reading it
  *  hits an I/O error.
  */
 static void
 make_tg_db(Xapian::WritableDatabase &db, const string & source)
 {
     string file = test_driver::get_srcdir();
     file += "/testdata/";
     file += source;
     file += ".txt";
     ifstream input;
     input.open(file.c_str());
     if (!input.is_open()) {
         FAIL_TEST("Couldn't open input: " << file);
     }

     Xapian::TermGenerator tg;
     tg.set_stemmer(Xapian::Stem("en"));
     // Check good() rather than just !eof() so that a read error (which need
     // not set eofbit) can't keep this loop adding documents forever.
     while (input.good()) {
         Xapian::Document doc;
         tg.set_document(doc);
         string line, data;
         // A failed getline() leaves `line` unchanged, so its result has to
         // be checked: otherwise a final line lacking a trailing newline
         // would be indexed again and again.
         while (getline(input, line)) {
             if (find_if(line.begin(), line.end(), C_isnotspace) == line.end())
                 break;
             tg.index_text(line);
             if (!data.empty()) data += ' ';
             data += line;
         }
         doc.set_data(data);
         db.add_document(doc);
     }
     if (input.bad()) {
         FAIL_TEST("Error reading input: " << file);
     }
 }

 /// Test snippets generated from the stored data of documents in an MSet.
 DEFINE_TESTCASE(snippetmisc1, backend) {
     Xapian::Database db = get_database("snippet", make_tg_db, "snippet");
     Xapian::Enquire enquire(db);
     enquire.set_weighting_scheme(Xapian::BoolWeight());
     Xapian::Stem stem("en");
     Xapian::MSet mset;

     // Snippet of the given length for the data of the MSet entry at `rank`.
     // Captures by reference, so it always uses the current value of `mset`.
     auto snippet_of = [&](Xapian::doccount rank, size_t length) {
         return mset.snippet(mset[rank].get_document().get_data(),
                             length, stem);
     };

     // Phrase query.
     static const char * const words[] = { "do", "we", "have" };
     Xapian::Query q(Xapian::Query::OP_PHRASE, words, words + 3);
     enquire.set_query(q);
     mset = enquire.get_mset(0, 6);
     TEST_EQUAL(mset.size(), 3);
     TEST_STRINGS_EQUAL(snippet_of(0, 40),
                        "How much o'brien <b>do we have</b>?  Miles...");
     TEST_STRINGS_EQUAL(snippet_of(1, 40),
                        "...Unicode: How much o’brien <b>do we have</b>?");
     TEST_STRINGS_EQUAL(snippet_of(2, 32),
                        "We do have we <b>do we have</b> do we.");

     // OR of two stemmed terms.
     enquire.set_query(Xapian::Query("Zwelcom") | Xapian::Query("Zmike"));
     mset = enquire.get_mset(0, 6);
     TEST_EQUAL(mset.size(), 3);
     TEST_STRINGS_EQUAL(snippet_of(0, 25),
                        "\"<b>Welcome</b> to <b>Mike's</b>...");
     TEST_STRINGS_EQUAL(snippet_of(1, 5),
                        "<b>Mike</b>...");
     TEST_STRINGS_EQUAL(snippet_of(2, 10),
                        "...<b>Mike</b> can...");

     // Wildcard query.
     enquire.set_query(Xapian::Query(Xapian::Query::OP_WILDCARD, "m"));
     mset = enquire.get_mset(0, 6);
     TEST_EQUAL(mset.size(), 5);
     TEST_STRINGS_EQUAL(snippet_of(0, 18),
                        "...<b>Mike's</b> <b>Mechanical</b>...");
     TEST_STRINGS_EQUAL(snippet_of(1, 80),
                        "<b>Mike</b> <b>McDonald</b> is a <b>mechanic</b> who enjoys repairing things of a <b>mechanical</b> sort.");
     TEST_STRINGS_EQUAL(snippet_of(2, 102),
                        "From autos to zip-lines, from tea-lights to x-rays, from sea ships to u-boats - <b>Mike</b> can fix them all.");
     TEST_STRINGS_EQUAL(snippet_of(3, 64),
                        "How <b>much</b> o'brien do we have?  <b>Miles</b> O'Brien, that's how <b>much</b>.");
     // Because the requested length counts bytes, the "fancy" apostrophe
     // leaves room for fewer Unicode characters here than in the previous
     // sample.
     TEST_STRINGS_EQUAL(snippet_of(4, 64),
                        "...<b>much</b> o’brien do we have?  <b>Miles</b> O’Brien, that’s how <b>much</b>.");
 }

 /// Test snippet selection when repeated terms compete with distinct ones.
 DEFINE_TESTCASE(snippet_termcover1, backend) {
     static const snippet_testcase testcases[] = {
         // "Zexampl" isn't in the database, so should get termweight 0.  With
         // max_tw added on, "rubbish" should have just under twice the
         // relevance of "example", so it should clearly win a straight fight.
         { "A rubbish, but a good example", 14, "...<b>rubbish</b>, but a..."},
         // A second occurrence of "rubbish" only has half the relevance
         // though, so "example" should add slightly more relevance.
         { "Rubbish and rubbish, and rubbish examples", 22, "...and <b>rubbish</b> <b>examples</b>"},
         // Same again.
         { "rubbish rubbish example rubbish rubbish", 16, "...<b>example</b> <b>rubbish</b>..." },
     };

     const Xapian::Stem stem("en");
     // SNIPPET_BACKGROUND_MODEL is left out so that the relevance decay for
     // repeated terms can be tested.
     const unsigned flags = Xapian::MSet::SNIPPET_EXHAUSTIVE;
     for (const snippet_testcase& tc : testcases) {
         Xapian::Enquire enquire(get_database("apitest_simpledata"));
         const Xapian::Query query(Xapian::Query::OP_OR,
                                   Xapian::Query("rubbish"),
                                   Xapian::Query("Zexampl"));
         enquire.set_query(query);

         Xapian::MSet mset = enquire.get_mset(0, 0);
         TEST_STRINGS_EQUAL(mset.snippet(tc.input, tc.len, stem, flags),
                            tc.expect);
     }
 }

 /// Test snippet term coverage when every term has the same relevance.
 DEFINE_TESTCASE(snippet_termcover2, backend) {
     // BoolWeight gives every term a termweight of 0, and hence a relevance
     // of 1.0 (as max_tw is set to 1.0 if it is zero).
     static const snippet_testcase testcases[] = {
         // Two different terms should be preferred, for diversity.
         { "rubbish rubbish example rubbish rubbish", 16, "...<b>example</b> <b>rubbish</b>..." },
         // Same again.
         { "Rubbish and rubbish, and rubbish examples", 22, "...and <b>rubbish</b> <b>examples</b>"},
         // The last of two equal snippets should win.
         { "A rubbish, but a good example", 14, "...a good <b>example</b>"},
     };

     const Xapian::Stem stem("en");
     // SNIPPET_BACKGROUND_MODEL is left out so that the relevance decay for
     // repeated terms can be tested.
     const unsigned flags = Xapian::MSet::SNIPPET_EXHAUSTIVE;
     for (const snippet_testcase& tc : testcases) {
         Xapian::Enquire enquire(get_database("apitest_simpledata"));
         const Xapian::Query query(Xapian::Query::OP_OR,
                                   Xapian::Query("rubbish"),
                                   Xapian::Query("Zexampl"));
         enquire.set_query(query);
         enquire.set_weighting_scheme(Xapian::BoolWeight());

         Xapian::MSet mset = enquire.get_mset(0, 0);
         TEST_STRINGS_EQUAL(mset.snippet(tc.input, tc.len, stem, flags),
                            tc.expect);
     }
 }

 /// Test the SNIPPET_EMPTY_WITHOUT_MATCH flag with and without a match.
 DEFINE_TESTCASE(snippet_empty, backend) {
     const Xapian::Stem stem("en");

     Xapian::Enquire enquire(get_database("apitest_simpledata"));
     const Xapian::Query query(Xapian::Query::OP_OR,
                               Xapian::Query("rubbish"),
                               Xapian::Query("Zexampl"));
     enquire.set_query(query);

     Xapian::MSet mset = enquire.get_mset(0, 0);

     // The two flag settings each sample text is checked with.
     const unsigned no_flags = 0;
     const unsigned empty_without_match =
         Xapian::MSet::SNIPPET_EMPTY_WITHOUT_MATCH;

     // Text which none of the query terms match.
     const char* unmatched = "A string without a match.";
     const size_t unmatched_len = strlen(unmatched);

     // With no flags set, the text comes back without any markup.
     TEST_STRINGS_EQUAL(mset.snippet(unmatched, unmatched_len, stem, no_flags),
                        unmatched);

     // With the flag set, the empty string comes back as no term matched.
     TEST_STRINGS_EQUAL(mset.snippet(unmatched, unmatched_len, stem,
                                     empty_without_match),
                        "");

     // Text which does match: the flag should make no difference.
     const char* matched = "A rubbish example text";
     const size_t matched_len = strlen(matched);

     TEST_STRINGS_EQUAL(mset.snippet(matched, matched_len, stem, no_flags),
                        "A <b>rubbish</b> <b>example</b> text");

     TEST_STRINGS_EQUAL(mset.snippet(matched, matched_len, stem,
                                     empty_without_match),
                        "A <b>rubbish</b> <b>example</b> text");
 }

 /// Test snippets for text where matches sit next to non-word characters.
 DEFINE_TESTCASE(snippet_start_nonspace, backend) {
     Xapian::Enquire enquire(get_database("apitest_simpledata"));
     enquire.set_query(Xapian::Query("foo") | Xapian::Query("10"));

     Xapian::MSet mset = enquire.get_mset(0, 0);

     // Every check uses a default-constructed stemmer.
     Xapian::Stem stem;

     // Marks a case whose requested length is strlen() of its text.
     const size_t WHOLE = static_cast<size_t>(-1);

     struct nonspace_case {
         const char* text;
         size_t len;
         const char* expect;
     };

     static const nonspace_case cases[] = {
         { "[xapian-devel] Re: foo", WHOLE, "[xapian-devel] Re: <b>foo</b>" },
         { "bar [xapian-devel] Re: foo", 24, "...[xapian-devel] Re: <b>foo</b>" },
         { "there is a $1000 prize for foo", 20, "...$1000 prize for <b>foo</b>" },
         { "-1 is less than foo", WHOLE, "-1 is less than <b>foo</b>" },
         { "+1 is less than foo", WHOLE, "+1 is less than <b>foo</b>" },
         { "/bin/sh is a foo", WHOLE, "/bin/sh is a <b>foo</b>" },
         { "'tis pity foo is a bar", WHOLE, "'tis pity <b>foo</b> is a bar" },
         { "\"foo bar\" he whispered", 11, "\"<b>foo</b> bar\" he..." },
         { "\\\\server\\share\\foo is a UNC path", WHOLE, "\\\\server\\share\\<b>foo</b> is a UNC path" },
         { "«foo» is a placeholder", 9, "«<b>foo</b>» is..." },
         { "#include <foo.h> to use libfoo", 12, "...&lt;<b>foo</b>.h&gt; to..." },
         { "¡foo!", WHOLE, "¡<b>foo</b>!" },
         { "¿foo?", WHOLE, "¿<b>foo</b>?" },
         { "(foo) test", WHOLE, "(<b>foo</b>) test" },
         { "{foo} test", WHOLE, "{<b>foo</b>} test" },
         { "`foo` test", WHOLE, "`<b>foo</b>` test" },
         { "@foo@ is replaced", WHOLE, "@<b>foo</b>@ is replaced" },
         { "%foo is a perl hash", WHOLE, "%<b>foo</b> is a perl hash" },
         { "&foo takes the address of foo", WHOLE, "&amp;<b>foo</b> takes the address of <b>foo</b>" },
         { "§3.1.4 foo", WHOLE, "§3.1.4 <b>foo</b>" },
         { "#foo", WHOLE, "#<b>foo</b>" },
         { "~foo~ test", WHOLE, "~<b>foo</b>~ test" },
         { "( foo )", WHOLE, "<b>foo</b>..." },
         { "(=foo=)", WHOLE, "<b>foo</b>..." },

         // Excessive non-word characters shouldn't be included.
         { "((((((foo", WHOLE, "<b>foo</b>" },

         // Characters which aren't useful shouldn't be included.
         { "bar,foo!", 5, "...<b>foo</b>!" },

         // Trailing characters should be included when useful.
         { "/opt/foo/bin/", WHOLE, "/opt/<b>foo</b>/bin/" },
         { "\"foo bar\"", WHOLE, "\"<b>foo</b> bar\"" },
         { "\\\\server\\share\\foo\\", WHOLE, "\\\\server\\share\\<b>foo</b>\\" },
         { "«foo»", WHOLE, "«<b>foo</b>»" },
         { "#include <foo>", WHOLE, "#include &lt;<b>foo</b>&gt;" },
         { "(foo)", WHOLE, "(<b>foo</b>)" },
         { "{foo}", WHOLE, "{<b>foo</b>}" },
         { "[foo]", WHOLE, "[<b>foo</b>]" },
         { "`foo`", WHOLE, "`<b>foo</b>`" },
         { "@foo@", WHOLE, "@<b>foo</b>@" },
         { "foo for 10¢", WHOLE, "<b>foo</b> for <b>10</b>¢" },
     };

     for (const nonspace_case& c : cases) {
         const size_t length = (c.len == WHOLE) ? strlen(c.text) : c.len;
         TEST_STRINGS_EQUAL(mset.snippet(c.text, length, stem), c.expect);
     }
 }

 /// Test that very small and zero lengths give an empty snippet.
 DEFINE_TESTCASE(snippet_small_zerolength, backend) {
     Xapian::Enquire enquire(get_database("apitest_simpledata"));
     const Xapian::Query query(Xapian::Query::OP_OR,
                               Xapian::Query("rubbish"),
                               Xapian::Query("mention"));
     enquire.set_query(query);
     Xapian::MSet mset = enquire.get_mset(0, 0);

     static const snippet_testcase testcases[] = {
         // Small lengths.
         { "mention junk rubbish", 3, "" },
         { "Project R.U.B.B.I.S.H. greenlit", 5, "" },
         { "What load rubbish", 3, "" },
         { "Mention rubbish", 4, "" },

         // Zero length.
         { "Rubbish and junk", 0, "" },
         { "Project R.U.B.B.I.S.H. greenlit", 0, "" },
         { "What a load of rubbish", 0, "" },
         { "rubbish mention rubbish mention", 0, "" },
     };

     for (const snippet_testcase& tc : testcases) {
         TEST_STRINGS_EQUAL(mset.snippet(tc.input, tc.len), tc.expect);
     }
 }

 /// Test snippets generated with the SNIPPET_NGRAMS flag.
 DEFINE_TESTCASE(snippet_ngrams, backend) {
     // Generator for the test database: a single document indexed with
     // FLAG_NGRAMS set on the term generator.
     auto make_ngram_db = [](Xapian::WritableDatabase& wdb,
                             const string&)
     {
         Xapian::TermGenerator tg;
         Xapian::Document doc;
         tg.set_flags(Xapian::TermGenerator::FLAG_NGRAMS);
         tg.set_document(doc);
         tg.index_text("明末時已經有香港地方的概念");
         wdb.add_document(doc);
     };
     Xapian::Database db = get_database("snippet_ngrams", make_ngram_db);
     Xapian::Enquire enquire(db);
     Xapian::QueryParser qp;
     const unsigned parse_flags = Xapian::QueryParser::FLAG_DEFAULT |
                                  Xapian::QueryParser::FLAG_NGRAMS;
     auto q = qp.parse_query("已經完成", parse_flags);
     enquire.set_query(q);

     Xapian::MSet mset = enquire.get_mset(0, 0);

     Xapian::Stem stem;
     const char* input = "明末時已經有香港地方的概念";
     const size_t len = strlen(input);

     const unsigned flags = Xapian::MSet::SNIPPET_NGRAMS;

     // Length covers the whole text.
     string whole = mset.snippet(input, len, stem, flags, "<b>", "</b>", "...");
     TEST_STRINGS_EQUAL(whole, "明末時<b>已</b><b>經</b>有香港地方的概念");

     // Length is half the byte length of the text.
     string half = mset.snippet(input, len / 2, stem, flags, "<b>", "</b>", "...");
     TEST_STRINGS_EQUAL(half, "...<b>已</b><b>經</b>有香港地...");
 }

 /// Test snippet() on the MSet from a default-constructed query.
 DEFINE_TESTCASE(snippet_empty_mset, backend) {
     const Xapian::Query empty_query;
     Xapian::Enquire enquire(get_database("apitest_simpledata"));
     enquire.set_query(empty_query);
     Xapian::MSet mset = enquire.get_mset(0, 0);
     // The text is expected back unchanged.
     TEST_STRINGS_EQUAL(mset.snippet("foo", 3), "foo");
 }

 /// Test snippet() on a default-constructed MSet.
 DEFINE_TESTCASE(snippet_empty_mset2, !backend) {
     const Xapian::MSet default_mset;
     // The text is expected back unchanged.
     TEST_STRINGS_EQUAL(default_mset.snippet("foo", 3), "foo");
 }
Xapian::MSet::size
Xapian::doccount size() const
Return number of items in this MSet object.
Definition: omenquire.cc:318

Xapian::WritableDatabase::add_document
Xapian::docid add_document(const Xapian::Document &document)
Add a new document to the database.
Definition: omdatabase.cc:902

Xapian::Query::OP_WILDCARD
Wildcard expansion.
Definition: query.h:255

Xapian::MSet::SNIPPET_NGRAMS
Generate n-grams for scripts without explicit word breaks.
Definition: mset.h:211

Xapian::MSet::SNIPPET_EXHAUSTIVE
Exhaustively evaluate candidate snippets in MSet::snippet().
Definition: mset.h:179

Xapian::QueryParser::FLAG_DEFAULT
The default flags.
Definition: queryparser.h:939

make_tg_db
static void make_tg_db(Xapian::WritableDatabase &db, const string &source)
Index file to a DB with TermGenerator.
Definition: api_snippets.cc:129

Xapian::Database
This class is used to access a database, or a group of databases.
Definition: database.h:68

Xapian::Stem
Class representing a stemming algorithm.
Definition: stem.h:62

Xapian::TermGenerator::set_document
void set_document(const Xapian::Document &doc)
Set the current document.
Definition: termgenerator.cc:64

Xapian::TermGenerator
Parses a piece of text and generates terms.
Definition: termgenerator.h:48

input
Definition: header.h:63

Xapian::MSet::snippet
std::string snippet(const std::string &text, size_t length=500, const Xapian::Stem &stemmer=Xapian::Stem(), unsigned flags=SNIPPET_BACKGROUND_MODEL|SNIPPET_EXHAUSTIVE, const std::string &hi_start="<b>", const std::string &hi_end="</b>", const std::string &omit="...") const
Generate a snippet.
Definition: omenquire.cc:304

snippet_testcase::expect
const char * expect
Definition: api_snippets.cc:41

Xapian::QueryParser
Build a Xapian::Query object from a user query string.
Definition: queryparser.h:778

testsuite.h
a generic test suite engine

Xapian::MSet
Class representing a list of search results.
Definition: mset.h:44

config.h

std
STL namespace.

Xapian::Enquire::get_mset
MSet get_mset(Xapian::doccount first, Xapian::doccount maxitems, Xapian::doccount checkatleast=0, const RSet *omrset=0, const MatchDecider *mdecider=0) const
Get (a portion of) the match set for the current query.
Definition: omenquire.cc:938

test_driver::get_srcdir
static std::string get_srcdir()
Read srcdir from environment and if not present, make a valiant attempt to guess a value...
Definition: testsuite.cc:129

snippet_testcase::len
size_t len
Definition: api_snippets.cc:40

Xapian::TermGenerator::FLAG_NGRAMS
Generate n-grams for scripts without explicit word breaks.
Definition: termgenerator.h:127

Xapian::TermGenerator::index_text
void index_text(const Xapian::Utf8Iterator &itor, Xapian::termcount wdf_inc=1, const std::string &prefix=std::string())
Index some text.
Definition: termgenerator.cc:109

apitest.h
test functionality of the Xapian API

Xapian::BoolWeight
Class implementing a "boolean" weighting scheme.
Definition: weight.h:433

Xapian::WritableDatabase
This class provides read/write access to a database.
Definition: database.h:789

Xapian::Query::OP_PHRASE
Match only documents where all subqueries match near and in order.
Definition: query.h:152

xapian.h
Public interfaces for the Xapian library.

snippet_testcase
Definition: api_snippets.cc:38

Xapian::TermGenerator::set_stemmer
void set_stemmer(const Xapian::Stem &stemmer)
Set the Xapian::Stem object to be used for generating stemmed terms.
Definition: termgenerator.cc:52

DEFINE_TESTCASE
DEFINE_TESTCASE(snippet1, backend)
Test snippets without stemming.
Definition: api_snippets.cc:45

Xapian::QueryParser::parse_query
Query parse_query(const std::string &query_string, unsigned flags=FLAG_DEFAULT, const std::string &default_prefix=std::string())
Parse a query.
Definition: queryparser.cc:162

Xapian::Enquire::set_query
void set_query(const Xapian::Query &query, Xapian::termcount qlen=0)
Set the query to run.
Definition: omenquire.cc:793

FAIL_TEST
#define FAIL_TEST(MSG)
Fail the current testcase with message MSG.
Definition: testsuite.h:68

snippet_testcase::input
const char * input
Definition: api_snippets.cc:39

get_database
Xapian::Database get_database(const string &dbname)
Definition: apitest.cc:48

api_snippets.h

Xapian::TermGenerator::set_flags
flags set_flags(flags toggle, flags mask=flags(0))
Set flags.
Definition: termgenerator.cc:83

Xapian::Enquire
This class provides an interface to the information retrieval system for the purpose of searching...
Definition: enquire.h:152

Xapian::Query::OP_OR
Match documents which at least one subquery matches.
Definition: query.h:92

testutils.h
Xapian-specific test helper functions and macros.

TEST_STRINGS_EQUAL
#define TEST_STRINGS_EQUAL(a, b)
Test for equality of two strings.
Definition: testsuite.h:287

Xapian::MSet::SNIPPET_EMPTY_WITHOUT_MATCH
Return the empty string if no term got matched.
Definition: mset.h:186

Xapian::Enquire::set_weighting_scheme
void set_weighting_scheme(const Weight &weight_)
Set the weighting scheme to use for queries.
Definition: omenquire.cc:819

Xapian::Query
Class representing a query.
Definition: query.h:46

TEST_EQUAL
#define TEST_EQUAL(a, b)
Test for equality of two things.
Definition: testsuite.h:278

Xapian::Document::set_data
void set_data(const std::string &data)
Set data stored in the document.
Definition: omdocument.cc:78

C_isnotspace
bool C_isnotspace(char ch)
Definition: stringutils.h:219

Xapian::QueryParser::FLAG_NGRAMS
Generate n-grams for scripts without explicit word breaks.
Definition: queryparser.h:895

Xapian::Document
A handle representing a document in a Xapian database.
Definition: document.h:61

testcases
static const testcase testcases[]
Definition: api_unicode.cc:39