Lucene++ - a full-featured C++ search engine
API Documentation
Go to the documentation of this file.
56 int32_t
encode(uint8_t* utf8, int32_t length);
58 int32_t
utf16to8(uint8_t* utf8, int32_t length);
59 int32_t
utf32to8(uint8_t* utf8, int32_t length);
93 int32_t
decode(
wchar_t* unicode, int32_t length);
95 int32_t
utf8to16(
wchar_t* unicode, int32_t length);
96 int32_t
utf8to32(
wchar_t* unicode, int32_t length);
132 int32_t
decode(
wchar_t* unicode, int32_t length);
static const uint16_t TRAIL_SURROGATE_MIN
Definition: UTF8Stream.h:22
ReaderPtr reader
Definition: UTF8Stream.h:72
int32_t utf16to16(wchar_t *unicode, int32_t length)
const uint8_t * utf8Begin
Definition: UTF8Stream.h:86
#define LUCENE_CLASS(Name)
Definition: LuceneObject.h:24
Definition: UTF8Stream.h:106
static const uint32_t SURROGATE_OFFSET
Definition: UTF8Stream.h:25
bool isOverlongSequence(uint32_t cp, int32_t length)
const wchar_t * unicodeBegin
Definition: UTF8Stream.h:49
virtual uint32_t readNext()
int32_t sequenceLength(uint32_t cp)
boost::shared_ptr< Reader > ReaderPtr
Definition: LuceneTypes.h:547
static const uint32_t CODE_POINT_MAX
Definition: UTF8Stream.h:26
int32_t utf8to32(wchar_t *unicode, int32_t length)
ReaderPtr reader
Definition: UTF8Stream.h:111
uint8_t * appendChar(uint8_t *utf8, uint32_t cp)
int32_t utf16to8(uint8_t *utf8, int32_t length)
virtual uint32_t readNext()
Definition: AbstractAllTermDocs.h:12
bool isValidNext(uint32_t &cp)
bool isSurrogate(uint32_t cp)
Base class for all Lucene classes.
Definition: LuceneObject.h:31
virtual uint32_t readNext()
const uint16_t * utf16End
Definition: UTF8Stream.h:129
bool isLeadSurrogate(uint32_t cp)
static const wchar_t UNICODE_REPLACEMENT_CHAR
Definition: UTF8Stream.h:28
virtual uint32_t readNext()=0
bool getSequence(uint32_t &cp, int32_t length)
uint8_t mask8(uint32_t b)
static const wchar_t UNICODE_TERMINATOR
Definition: UTF8Stream.h:29
static const uint16_t LEAD_SURROGATE_MIN
Definition: UTF8Stream.h:17
UTF16Decoder(const uint16_t *utf16Begin, const uint16_t *utf16End)
int32_t utf32to8(uint8_t *utf8, int32_t length)
UTF8EncoderStream(const ReaderPtr &reader)
int32_t utf16to32(wchar_t *unicode, int32_t length)
UTF8DecoderStream(const ReaderPtr &reader)
virtual ~UTF8EncoderStream()
static const uint16_t LEAD_OFFSET
Definition: UTF8Stream.h:24
int32_t encode(uint8_t *utf8, int32_t length)
Definition: UTF8Stream.h:81
const uint8_t * utf8End
Definition: UTF8Stream.h:90
virtual ~UTF8DecoderStream()
virtual uint32_t readNext()
Definition: UTF8Stream.h:67
static const uint16_t LEAD_SURROGATE_MAX
Definition: UTF8Stream.h:21
int32_t utf8to16(wchar_t *unicode, int32_t length)
Definition: UTF8Stream.h:44
const uint16_t * utf16Begin
Definition: UTF8Stream.h:125
virtual uint32_t readNext()
static const uint16_t TRAIL_SURROGATE_MAX
Definition: UTF8Stream.h:23
uint16_t mask16(uint32_t c)
const wchar_t * unicodeEnd
Definition: UTF8Stream.h:53
UTF8Encoder(const wchar_t *unicodeBegin, const wchar_t *unicodeEnd)
Definition: UTF8Stream.h:14
bool isTrailSurrogate(uint32_t cp)
int32_t decode(wchar_t *unicode, int32_t length)
bool isValidCodePoint(uint32_t cp)
UTF8Decoder(const uint8_t *utf8Begin, const uint8_t *utf8End)
Definition: UTF8Stream.h:120
int32_t decode(wchar_t *unicode, int32_t length)
clucene.sourceforge.net