summaryrefslogtreecommitdiffstats
path: root/reader/src/formats/html/HtmlDescriptionReader.cpp
blob: 6ebcb8bbe3dd9c55f6e488cc5cf81acc83c70c33 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
/*
 * Copyright (C) 2004-2012 Geometer Plus <contact@geometerplus.com>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
 * 02110-1301, USA.
 */

#include "HtmlDescriptionReader.h"

#include "../../library/Book.h"

// Creates a description reader bound to `book`.
//
// The HtmlReader base is initialised with the encoding currently stored in
// the book. The book's title is reset to an empty string; tagHandler() only
// starts collecting a TITLE element while the stored title is empty.
HtmlDescriptionReader::HtmlDescriptionReader(Book &book)
	: HtmlReader(book.encoding()),
	  myBook(book) {
	myBook.setTitle("");
}

void HtmlDescriptionReader::startDocumentHandler() {
	myReadTitle = false;
}

void HtmlDescriptionReader::endDocumentHandler() {
	if (!myBook.title().empty()) {
		const char *titleStart = myBook.title().data();
		const char *titleEnd = titleStart + myBook.title().length();
		std::string newTitle;
		myConverter->convert(newTitle, titleStart, titleEnd);
		myBook.setTitle(newTitle);
	}
}

bool HtmlDescriptionReader::tagHandler(const HtmlTag &tag) {
	if (tag.Name == "TITLE") {
		if (myReadTitle && !tag.Start) {
			myBook.setTitle(myBuffer);
			myBuffer.erase();
		}
		myReadTitle = tag.Start && myBook.title().empty();
		return true;
	} else if (tag.Start && tag.Name == "META") {
		std::vector<HtmlAttribute>::const_iterator it = tag.Attributes.begin();
		for (; it != tag.Attributes.end(); ++it) {
			if (it->Name == "CONTENT") {
				break;
			}
		}
		if (it != tag.Attributes.end()) {
			const std::string prefix = "charset=";
			std::size_t index = it->Value.find(prefix);
			if (index != std::string::npos) {
				std::string charset = it->Value.substr(index + prefix.length());
				index = charset.find(';');
				if (index != std::string::npos) {
					charset = charset.substr(0, index);
				}
				index = charset.find(' ');
				if (index != std::string::npos) {
					charset = charset.substr(0, index);
				}
				myBook.setEncoding(charset);
			}
		}
	}
	return tag.Name != "BODY";
}

// Receives a run of character data from the document.
//
// While a TITLE element is being collected (myReadTitle is set), the `len`
// bytes starting at `text` are appended to myBuffer; otherwise the data is
// ignored. The third (unnamed) parameter is unused. Always returns true.
bool HtmlDescriptionReader::characterDataHandler(const char *text, std::size_t len, bool) {
	if (!myReadTitle) {
		return true;
	}
	myBuffer.append(text, len);
	return true;
}