Lucene++ - a full-featured, c++ search engine
API Documentation


Loading...
Searching...
No Matches
KeywordTokenizer.h
Go to the documentation of this file.
1
2// Copyright (c) 2009-2014 Alan Wright. All rights reserved.
3// Distributable under the terms of either the Apache License (Version 2.0)
4// or the GNU Lesser General Public License.
6
7#ifndef KEYWORDTOKENIZER_H
8#define KEYWORDTOKENIZER_H
9
10#include "Tokenizer.h"
11
12namespace Lucene {
13
/// Emits the entire input as a single token.
///
/// Derives from Tokenizer (a TokenStream whose input is a Reader).
///
/// NOTE(review): this listing skips line numbers 17, 22, 24, 31 and 32. The
/// cross-reference entries for this header mention `termAtt` (line 31),
/// `offsetAtt` (line 32) and a `KeywordTokenizer(const ReaderPtr&)` overload,
/// none of which appear below -- confirm against the real header before
/// relying on this declaration being complete.
15class LPPAPI KeywordTokenizer : public Tokenizer {
16public:
 /// Constructors: each takes the Reader to tokenize (`input`) plus a
 /// `bufferSize`; two overloads additionally take an AttributeSource or an
 /// AttributeFactory. Presumably `bufferSize` sizes the term buffer -- the
 /// definitions are not visible here, TODO confirm in the .cpp.
18 KeywordTokenizer(const ReaderPtr& input, int32_t bufferSize);
19 KeywordTokenizer(const AttributeSourcePtr& source, const ReaderPtr& input, int32_t bufferSize);
20 KeywordTokenizer(const AttributeFactoryPtr& factory, const ReaderPtr& input, int32_t bufferSize);
21
23
25
26protected:
 /// Declared here only; the value is defined out of line (not visible).
 /// Presumably the buffer size used when none is supplied -- TODO confirm.
27 static const int32_t DEFAULT_BUFFER_SIZE;
28
 /// NOTE(review): looks like a flag marking that the single token has
 /// already been produced -- inferred from the name, confirm in the .cpp.
29 bool done;
 /// NOTE(review): presumably the offset recorded for end() -- inferred
 /// from the name, confirm in the .cpp.
30 int32_t finalOffset;
33
34protected:
 /// Initialisation helper taking a buffer size; presumably shared by the
 /// constructors (body not visible here).
35 void init(int32_t bufferSize);
36
37public:
 /// Consumers (i.e., IndexWriter) use this method to advance the stream to
 /// the next token.
38 virtual bool incrementToken();
 /// Called by the consumer after the last token has been consumed.
39 virtual void end();
 /// Resets this stream to the beginning. This is an optional operation.
40 virtual void reset();
41};
42
43}
44
45#endif
#define LUCENE_CLASS(Name)
Definition LuceneObject.h:24
Emits the entire input as a single token.
Definition KeywordTokenizer.h:15
OffsetAttributePtr offsetAtt
Definition KeywordTokenizer.h:32
void init(int32_t bufferSize)
virtual bool incrementToken()
Consumers (i.e., IndexWriter) use this method to advance the stream to the next token....
bool done
Definition KeywordTokenizer.h:29
KeywordTokenizer(const ReaderPtr &input)
KeywordTokenizer(const AttributeFactoryPtr &factory, const ReaderPtr &input, int32_t bufferSize)
virtual void reset()
Resets this stream to the beginning. This is an optional operation, so subclasses may or may not impl...
TermAttributePtr termAtt
Definition KeywordTokenizer.h:31
static const int32_t DEFAULT_BUFFER_SIZE
Definition KeywordTokenizer.h:27
KeywordTokenizer(const ReaderPtr &input, int32_t bufferSize)
int32_t finalOffset
Definition KeywordTokenizer.h:30
KeywordTokenizer(const AttributeSourcePtr &source, const ReaderPtr &input, int32_t bufferSize)
virtual void end()
This method is called by the consumer after the last token has been consumed, after incrementToken() ...
A Tokenizer is a TokenStream whose input is a Reader.
Definition Tokenizer.h:20
Definition AbstractAllTermDocs.h:12
boost::shared_ptr< AttributeSource > AttributeSourcePtr
Definition LuceneTypes.h:520
boost::shared_ptr< TermAttribute > TermAttributePtr
Definition LuceneTypes.h:58
boost::shared_ptr< OffsetAttribute > OffsetAttributePtr
Definition LuceneTypes.h:40
boost::shared_ptr< Reader > ReaderPtr
Definition LuceneTypes.h:547
boost::shared_ptr< AttributeFactory > AttributeFactoryPtr
Definition LuceneTypes.h:519

clucene.sourceforge.net