CharStream adds correctOffset functionality over Reader. All Tokenizers accept a CharStream instead of a Reader as input, which enables arbitrary character-based filtering before tokenization. The correctOffset method fixes offsets to account for the removal or insertion of characters, so that the offsets reported in the tokens match the character offsets of the original Reader.
More...
#include <CharStream.h>
|
virtual | ~CharStream () |
|
virtual String | getClassName () |
|
boost::shared_ptr< CharStream > | shared_from_this () |
|
virtual int32_t | correctOffset (int32_t currentOff)=0 |
| Called by CharFilter(s) and Tokenizer to correct token offset.
|
|
virtual | ~Reader () |
|
boost::shared_ptr< Reader > | shared_from_this () |
|
virtual int32_t | read () |
| Read a single character.
|
|
virtual int32_t | read (wchar_t *buffer, int32_t offset, int32_t length)=0 |
| Read characters into a portion of an array.
|
|
virtual int64_t | skip (int64_t n) |
| Skip characters.
|
|
virtual void | close ()=0 |
| Close the stream.
|
|
virtual bool | markSupported () |
| Tell whether this stream supports the mark() operation.
|
|
virtual void | mark (int32_t readAheadLimit) |
| Mark the present position in the stream. Subsequent calls to reset() will attempt to reposition the stream to this point.
|
|
virtual void | reset () |
| Reset the stream. If the stream has been marked, then attempt to reposition it at the mark. If the stream has not been marked, then attempt to reset it in some way appropriate to the particular stream, for example by repositioning it to its starting point.
|
|
virtual int64_t | length () |
| The number of bytes in the stream.
|
|
virtual | ~LuceneObject () |
|
virtual void | initialize () |
| Called directly after instantiation to create objects that depend on this object being fully constructed.
|
|
virtual LuceneObjectPtr | clone (const LuceneObjectPtr &other=LuceneObjectPtr()) |
| Return clone of this object.
|
|
virtual int32_t | hashCode () |
| Return hash code for this object.
|
|
virtual bool | equals (const LuceneObjectPtr &other) |
| Return whether two objects are equal.
|
|
virtual int32_t | compareTo (const LuceneObjectPtr &other) |
| Compare two objects.
|
|
virtual String | toString () |
| Returns a string representation of the object.
|
|
virtual | ~LuceneSync () |
|
virtual SynchronizePtr | getSync () |
| Return this object's synchronization lock.
|
|
virtual LuceneSignalPtr | getSignal () |
| Return this object's signal.
|
|
virtual void | lock (int32_t timeout=0) |
| Lock this object using an optional timeout.
|
|
virtual void | unlock () |
| Unlock this object.
|
|
virtual bool | holdsLock () |
| Returns true if this object is currently locked by the current thread.
|
|
virtual void | wait (int32_t timeout=0) |
| Wait for signal using an optional timeout.
|
|
virtual void | notifyAll () |
| Notify all threads waiting for signal.
|
|
CharStream adds correctOffset functionality over Reader. All Tokenizers accept a CharStream instead of a Reader as input, which enables arbitrary character-based filtering before tokenization. The correctOffset method fixes offsets to account for the removal or insertion of characters, so that the offsets reported in the tokens match the character offsets of the original Reader.
◆ ~CharStream()
virtual Lucene::CharStream::~CharStream |
( |
| ) |
|
|
virtual |
◆ _getClassName()
static String Lucene::CharStream::_getClassName |
( |
| ) |
|
|
inline static |
◆ correctOffset()
virtual int32_t Lucene::CharStream::correctOffset |
( |
int32_t |
currentOff | ) |
|
|
pure virtual |
◆ getClassName()
virtual String Lucene::CharStream::getClassName |
( |
| ) |
|
|
inline virtual |
◆ shared_from_this()
boost::shared_ptr< CharStream > Lucene::CharStream::shared_from_this |
( |
| ) |
|
|
inline |
The documentation for this class was generated from the following file: