strusAnalyzer  0.17
posTaggerInstanceInterface.hpp
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2018 Patrick P. Frey
3  *
4  * This Source Code Form is subject to the terms of the Mozilla Public
5  * License, v. 2.0. If a copy of the MPL was not distributed with this
6  * file, You can obtain one at http://mozilla.org/MPL/2.0/.
7  */
10 #ifndef _STRUS_ANALYZER_POS_TAGGER_INSTANCE_INTERFACE_HPP_INCLUDED
11 #define _STRUS_ANALYZER_POS_TAGGER_INSTANCE_INTERFACE_HPP_INCLUDED
13 #include <string>
14 
16 namespace strus
17 {
18 
20 class PosTaggerDataInterface;
21 
23 class PosTaggerInstanceInterface
24 {
25 public:
27  virtual ~PosTaggerInstanceInterface(){}
28 
31  virtual void addContentExpression( const std::string& expression)=0;
32 
37  virtual void addPosTaggerInputPunctuation( const std::string& expression, const std::string& punct, int priority)=0;
38 
42  virtual std::string getPosTaggerInput( const analyzer::DocumentClass& dclass, const std::string& content) const=0;
43 
49  virtual std::string markupDocument( const PosTaggerDataInterface* data, int docno, const analyzer::DocumentClass& dclass, const std::string& content) const=0;
50 };
51 
52 }//namespace
53 #endif
54 
virtual std::string markupDocument(const PosTaggerDataInterface *data, int docno, const analyzer::DocumentClass &dclass, const std::string &content) const =0
Markup a document with POS tagging info.
virtual std::string getPosTaggerInput(const analyzer::DocumentClass &dclass, const std::string &content) const =0
Map a document to a text string as input of POS tagging.
Defines a description of the properties of an original document processed by the segmenter.
Definition: documentClass.hpp:21
Structure describing the MIME type plus some attributes that could be relevant for analysis of a docu...
virtual void addPosTaggerInputPunctuation(const std::string &expression, const std::string &punct, int priority)=0
Defines a punctuation marker for POS tagger input.
Interface for the data built by a POS tagger.
Definition: posTaggerDataInterface.hpp:24
virtual void addContentExpression(const std::string &expression)=0
Defines an expression for selecting chunks from a document to do tagging.
virtual ~PosTaggerInstanceInterface()
Destructor.
Definition: posTaggerInstanceInterface.hpp:27
Interface to define a POS tagger instance for creating the input for POS tagging to build the data an...
Definition: posTaggerInstanceInterface.hpp:23