1
/* This file is part of Strigi Desktop Search
3
* Copyright (C) 2007 Jos van den Oever <jos@vandenoever.info>
5
* This library is free software; you can redistribute it and/or
6
* modify it under the terms of the GNU Library General Public
7
* License as published by the Free Software Foundation; either
8
* version 2 of the License, or (at your option) any later version.
10
* This library is distributed in the hope that it will be useful,
11
* but WITHOUT ANY WARRANTY; without even the implied warranty of
12
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13
* Library General Public License for more details.
15
* You should have received a copy of the GNU Library General Public License
16
* along with this library; see the file COPYING.LIB. If not, write to
17
* the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
18
* Boston, MA 02110-1301, USA.
21
#include "pdfendanalyzer.h"
22
#include <strigi/strigiconfig.h>
23
#include "analysisresult.h"
24
#include "fieldtypes.h"
25
#include "textutils.h"
29
using namespace Strigi;
32
PdfEndAnalyzerFactory::registerFields(FieldRegister& reg) {
33
typeField = reg.typeField;
37
PdfEndAnalyzer::PdfEndAnalyzer(const PdfEndAnalyzerFactory* f) :factory(f) {
38
parser.setStreamHandler(this);
39
parser.setTextHandler(this);
42
PdfEndAnalyzer::handle(InputStream* s) {
45
char r = analysisresult->indexChild(str.str(), analysisresult->mTime(), s);
46
// how do we set the error message in this case?
47
return (r) ?Error :Ok;
50
PdfEndAnalyzer::handle(const std::string& s) {
51
analysisresult->addText(s.c_str(), (uint32_t)s.length());
55
PdfEndAnalyzer::checkHeader(const char* header, int32_t headersize) const {
56
return headersize > 7 && strncmp(header, "%PDF-1.", 7) == 0;
59
PdfEndAnalyzer::analyze(AnalysisResult& as, InputStream* in) {
62
StreamStatus r = parser.parse(in);
63
if (r != Eof) m_error.assign(parser.error());
64
analysisresult->addValue(factory->typeField,
65
"http://www.semanticdesktop.org/ontologies/2007/03/22/nfo#PaginatedTextDocument");
66
return (r == Eof) ?(signed char)0 :(signed char)-1;