10 #ifndef _STRUS_ANALYZER_DOCUMENT_CLASS_DETECTOR_INTERFACE_HPP_INCLUDED
11 #define _STRUS_ANALYZER_DOCUMENT_CLASS_DETECTOR_INTERFACE_HPP_INCLUDED
33 const std::string& scheme,
34 const std::string& mimeType,
35 const std::vector<std::string>& select_expressions,
36 const std::vector<std::string>& reject_expressions)=0;
Defines a description of the properties of an original document processed by the segmenter.
Definition: documentClass.hpp:21
Structure describing the MIME type plus some attributes that could be relevant for analysis of a document.
virtual bool detect(analyzer::DocumentClass &dclass, const char *contentBegin, std::size_t contentBeginSize, bool isComplete) const =0
Scans the start of a document to detect its classification attributes (MIME type, etc.).
Defines a detector that returns a content description for a document content it recognizes.
Definition: documentClassDetectorInterface.hpp:21
virtual ~DocumentClassDetectorInterface()
Destructor.
Definition: documentClassDetectorInterface.hpp:25
virtual void defineDocumentSchemeDetector(const std::string &scheme, const std::string &mimeType, const std::vector< std::string > &select_expressions, const std::vector< std::string > &reject_expressions)=0
Define a detector for a document scheme.