Lucene++ - a full-featured, C++ search engine
API Documentation


 All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Pages
KeywordTokenizer.h
Go to the documentation of this file.
1 // Copyright (c) 2009-2014 Alan Wright. All rights reserved.
3 // Distributable under the terms of either the Apache License (Version 2.0)
4 // or the GNU Lesser General Public License.
6 
7 #ifndef KEYWORDTOKENIZER_H
8 #define KEYWORDTOKENIZER_H
9 
10 #include "Tokenizer.h"
11 
12 namespace Lucene {
13 
/// Emits the entire input as a single token.
/// Derives from Tokenizer (a TokenStream whose input is a Reader).
15 class LPPAPI KeywordTokenizer : public Tokenizer {
16 public:
    // Construction overloads. Every overload takes the Reader to tokenize; three of them
    // also take an explicit bufferSize, and of those, one additionally takes an
    // AttributeSource and one an AttributeFactory.
    // NOTE(review): bufferSize is presumably the initial term-buffer capacity, and the
    // one-argument overload presumably falls back to DEFAULT_BUFFER_SIZE - confirm in
    // KeywordTokenizer.cpp.
17  KeywordTokenizer(const ReaderPtr& input);
18  KeywordTokenizer(const ReaderPtr& input, int32_t bufferSize);
19  KeywordTokenizer(const AttributeSourcePtr& source, const ReaderPtr& input, int32_t bufferSize);
20  KeywordTokenizer(const AttributeFactoryPtr& factory, const ReaderPtr& input, int32_t bufferSize);
21 
    // Virtual destructor.
22  virtual ~KeywordTokenizer();
23 
    // NOTE(review): source line 24 is not rendered in this listing. The cross-reference
    // index of this page lists the macro LUCENE_CLASS(Name), so this is presumably where
    // it is invoked - confirm against the real header.
25 
26 protected:
    // Declared here only; the value is defined outside this header.
27  static const int32_t DEFAULT_BUFFER_SIZE;
28 
    // NOTE(review): presumably set once the single token has been emitted - confirm.
29  bool done;
    // NOTE(review): presumably the end offset reported after the input is consumed - confirm.
30  int32_t finalOffset;
    // NOTE(review): source lines 31-32 are not rendered in this listing. The
    // cross-reference index of this page places `TermAttributePtr termAtt` at
    // KeywordTokenizer.h:31 and `OffsetAttributePtr offsetAtt` at KeywordTokenizer.h:32.
33 
34 protected:
    // Initialisation helper taking the buffer size.
    // NOTE(review): presumably shared by the constructors - confirm in KeywordTokenizer.cpp.
35  void init(int32_t bufferSize);
36 
37 public:
    // Virtual token-stream operations.
    // NOTE(review): presumably overrides of the TokenStream interface inherited through
    // Tokenizer - confirm against Tokenizer.h / TokenStream.h.
38  virtual bool incrementToken();
39  virtual void end();
40  virtual void reset();
41 };
42 
43 }
44 
45 #endif
TermAttributePtr termAtt
Definition: KeywordTokenizer.h:31
boost::shared_ptr< Reader > ReaderPtr
Definition: LuceneTypes.h:547
boost::shared_ptr< AttributeFactory > AttributeFactoryPtr
Definition: LuceneTypes.h:519
boost::shared_ptr< AttributeSource > AttributeSourcePtr
Definition: LuceneTypes.h:520
boost::shared_ptr< TermAttribute > TermAttributePtr
Definition: LuceneTypes.h:58
int32_t finalOffset
Definition: KeywordTokenizer.h:30
#define LUCENE_CLASS(Name)
Definition: LuceneObject.h:24
Lucene
Definition: AbstractAllTermDocs.h:12
boost::shared_ptr< OffsetAttribute > OffsetAttributePtr
Definition: LuceneTypes.h:40
bool done
Definition: KeywordTokenizer.h:29
A Tokenizer is a TokenStream whose input is a Reader.
Definition: Tokenizer.h:20
Emits the entire input as a single token.
Definition: KeywordTokenizer.h:15
OffsetAttributePtr offsetAtt
Definition: KeywordTokenizer.h:32

clucene.sourceforge.net