Main Page   Namespace List   Class Hierarchy   Alphabetical List   Compound List   File List   Namespace Members   Compound Members   File Members   Related Pages  

IndriParser.hpp

Go to the documentation of this file.
00001 /*==========================================================================
00002  * Copyright (c) 2003-2004 University of Massachusetts.  All Rights Reserved.
00003  *
00004  * Use of the Lemur Toolkit for Language Modeling and Information Retrieval
00005  * is subject to the terms of the software license set forth in the LICENSE
00006  * file included with this software, and also available at
00007  * http://www.lemurproject.org/license.html
00008  *
00009  *==========================================================================
00010 */
00011 
00012 
00013 //
00014 // Parser
00015 // 
00016 // 11 May 2004 -- tds
00017 //
00018 
00019 #ifndef INDRI_PARSER_HPP
00020 #define INDRI_PARSER_HPP
00021 
00022 #include "indri/ObjectHandler.hpp"
00023 #include "indri/UnparsedDocument.hpp"
00024 #include "indri/ParsedDocument.hpp"
00025 #include <map>
00026 #include <vector>
00027 
00028 namespace indri {
00029   class Parser : public ObjectHandler<UnparsedDocument> { // Abstract parser interface: every operation below is pure virtual; derives from ObjectHandler<UnparsedDocument>.
00030   public:
00031     virtual ~Parser() {}; // Virtual, empty destructor so implementations can be destroyed through a Parser*. NOTE(review): the ';' after the body is redundant.
00032 
00033     virtual ParsedDocument* parse( UnparsedDocument* document ) = 0; // Takes an UnparsedDocument* and returns a ParsedDocument*; ownership of either pointer is not stated in this header -- TODO confirm.
00034     virtual void setTags( const std::vector<std::string>& include, // presumably tag names to include -- TODO confirm against implementations. NOTE(review): std::string is used but <string> is not included directly here.
00035                           const std::vector<std::string>& exclude, // presumably tag names to exclude -- TODO confirm
00036                           const std::vector<std::string>& index, // presumably tag names to index -- TODO confirm
00037                           const std::vector<std::string>& metadata, // presumably tag names treated as metadata -- TODO confirm
00038                           const std::map<std::string, std::string>& conflations ) = 0; // string-to-string map; presumably maps a tag name to the name it is conflated with -- TODO confirm
00039 
00040     virtual void handle( UnparsedDocument* document ) = 0; // Accepts an UnparsedDocument*; presumably the ObjectHandler<UnparsedDocument> entry point -- confirm in indri/ObjectHandler.hpp.
00041     virtual void setHandler( ObjectHandler<ParsedDocument>& handler ) = 0; // Takes a handler of ParsedDocument objects by non-const reference; presumably the recipient of parsed output -- TODO confirm.
00042   };
00043 }
00044 
00045 #endif // INDRI_PARSER_HPP
00046 
00047 

Generated on Wed Nov 3 12:58:58 2004 for Lemur Toolkit by doxygen 1.2.18