diff options
Diffstat (limited to 'debian/htdig/htdig-3.2.0b6/htdig/Parsable.h')
-rw-r--r-- | debian/htdig/htdig-3.2.0b6/htdig/Parsable.h | 57 |
1 files changed, 57 insertions, 0 deletions
diff --git a/debian/htdig/htdig-3.2.0b6/htdig/Parsable.h b/debian/htdig/htdig-3.2.0b6/htdig/Parsable.h new file mode 100644 index 00000000..7149fe7c --- /dev/null +++ b/debian/htdig/htdig-3.2.0b6/htdig/Parsable.h @@ -0,0 +1,57 @@ +// +// Parsable.h +// +// Parsable: Base class for file parsers (HTML, PDF, ExternalParser ...) +// +// Part of the ht://Dig package <http://www.htdig.org/> +// Copyright (c) 1995-2004 The ht://Dig Group +// For copyright details, see the file COPYING in your distribution +// or the GNU Library General Public License (LGPL) version 2 or later +// <http://www.gnu.org/copyleft/lgpl.html> +// +// $Id: Parsable.h,v 1.10 2004/05/28 13:15:15 lha Exp $ +// + +#ifndef _Parsable_h_ +#define _Parsable_h_ + +#include "htString.h" +#include "Retriever.h" + +class URL; + + +class Parsable +{ +public: + // + // Construction/Destruction + // + Parsable(); + virtual ~Parsable(); + + // + // Main parser interface. + // + virtual void parse(Retriever &retriever, URL &) = 0; + + // + // The rest of the members are used by the Document to provide us + // the data that we contain. + // + virtual void setContents(char *data, int length); + void addString(Retriever& retriever, char *s, int& wordindex, int slot); + void addKeywordString(Retriever& retriever, char *s, int& wordindex); + +protected: + String *contents; + int max_head_length; + int max_description_length; + int max_meta_description_length; + int max_keywords, keywordsCount; + unsigned int minimum_word_length; +}; + +#endif + + |