28 #ifndef XAPIAN_INCLUDED_WORD_BREAKER_H
29 #define XAPIAN_INCLUDED_WORD_BREAKER_H
32 # error config.h must be included first in each C++ source file
95 return !(*this == other);
Iterator returning unigrams and bigrams.
NgramIterator & operator++()
bool operator!=(const NgramIterator &other) const
NgramIterator(const std::string &s)
const std::string & operator*() const
bool unigram() const
Is this a unigram?
const Xapian::Utf8Iterator & get_utf8iterator() const
unsigned offset
Offset to penultimate Unicode character in current_token.
std::string current_token
bool operator==(const NgramIterator &other) const
void init()
Call to set current_token at the start.
NgramIterator(const Xapian::Utf8Iterator &it_)
An iterator which returns Unicode character values from a UTF-8 encoded string.
Unicode and UTF-8 related classes and functions.
void get_unbroken(Xapian::Utf8Iterator &it)
bool is_unbroken_script(unsigned codepoint)
bool is_ngram_enabled()
Should we use the n-gram code?