SILVERCODERS DocToText  4.0.1512
Converts DOC, XLS, XLSB, PPT, RTF, ODF (ODT, ODS, ODP), OOXML (DOCX, XLSX, PPTX), iWork (PAGES, NUMBERS, KEYNOTE), ODFXML (FODP, FODS, FODT), PDF, EML and HTML documents to plain text. Extracts metadata and annotations.
 All Classes Functions Enumerations Pages
doctotext::PlainTextExtractor Member List

This is the complete list of members for doctotext::PlainTextExtractor, including all inherited members.

extractMetadata(const std::string &file_name, Metadata &metadata) doctotext::PlainTextExtractor
extractMetadata(const char *file_name, Metadata &metadata) doctotext::PlainTextExtractor
extractMetadata(const char *buffer, size_t size, Metadata &metadata) doctotext::PlainTextExtractor
extractMetadata(ParserType parser_type, bool fallback, const std::string &file_name, Metadata &metadata) doctotext::PlainTextExtractor
extractMetadata(ParserType parser_type, bool fallback, const char *file_name, Metadata &metadata) doctotext::PlainTextExtractor
extractMetadata(ParserType parser_type, bool fallback, const char *buffer, size_t size, Metadata &metadata) doctotext::PlainTextExtractor
getAttachments(std::vector< Attachment > &attachments) const doctotext::PlainTextExtractor
getAttachments(const Attachment *&attachments, size_t &number_of_attachments) const doctotext::PlainTextExtractor
getAttachments() const doctotext::PlainTextExtractor
getNumberOfAttachments() const doctotext::PlainTextExtractor
getNumberOfLinks() const doctotext::PlainTextExtractor
getParsedLinks(std::vector< Link > &links) const doctotext::PlainTextExtractor
getParsedLinks(const Link *&links, size_t &number_of_links) const doctotext::PlainTextExtractor
getParsedLinks() const doctotext::PlainTextExtractor
PARSER_AUTO enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_DOC enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_EML enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_HTML enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_IWORK enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_ODF_OOXML enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_ODFXML enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_PDF enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_PPT enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_RTF enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_TXT enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_XLS enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
PARSER_XLSB enum value (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
ParserType enum name doctotext::PlainTextExtractor
parserTypeByFileContent(const std::string &file_name, ParserType &parser_type) doctotext::PlainTextExtractor
parserTypeByFileContent(const char *file_name, ParserType &parser_type) doctotext::PlainTextExtractor
parserTypeByFileContent(const char *buffer, size_t size, ParserType &parser_type) doctotext::PlainTextExtractor
parserTypeByFileExtension(const std::string &file_name) doctotext::PlainTextExtractor
parserTypeByFileExtension(const char *file_name) doctotext::PlainTextExtractor
PlainTextExtractor(ParserType parser_type=PARSER_AUTO) doctotext::PlainTextExtractor
processFile(const std::string &file_name, std::string &text) doctotext::PlainTextExtractor
processFile(const char *file_name, char *&text) doctotext::PlainTextExtractor
processFile(const char *buffer, size_t size, char *&text) doctotext::PlainTextExtractor
processFile(const char *buffer, size_t size, std::string &text) doctotext::PlainTextExtractor
processFile(ParserType parser_type, bool fallback, const std::string &file_name, std::string &text) doctotext::PlainTextExtractor
processFile(ParserType parser_type, bool fallback, const char *file_name, char *&text) doctotext::PlainTextExtractor
processFile(ParserType parser_type, bool fallback, const char *buffer, size_t size, char *&text) doctotext::PlainTextExtractor
processFile(ParserType parser_type, bool fallback, const char *buffer, size_t size, std::string &text) doctotext::PlainTextExtractor
setFormattingStyle(const FormattingStyle &style) doctotext::PlainTextExtractor
setLogStream(std::ostream &log_stream) doctotext::PlainTextExtractor
setManageXmlParser(bool manage) doctotext::PlainTextExtractor
setVerboseLogging(bool verbose) doctotext::PlainTextExtractor
setXmlParseMode(XmlParseMode mode) (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor
~PlainTextExtractor() (defined in doctotext::PlainTextExtractor) doctotext::PlainTextExtractor