summaryrefslogtreecommitdiffstats
path: root/reader/src/formats/util/TextFormatDetector.cpp
blob: 4a3ef678387ae97c41157487c781124b5eb61934 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
/*
 * Copyright (C) 2004-2012 Geometer Plus <[email protected]>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
 * 02110-1301, USA.
 */

#include <cstring>
#include <cctype>
#include <algorithm>

#include <ZLInputStream.h>
#include <ZLUnicodeUtil.h>

#include "TextFormatDetector.h"

TextFormatDetector::TextFormatDetector() {
}

TextFormatDetector::~TextFormatDetector() {
}

bool TextFormatDetector::isHtml(ZLInputStream &stream) const {
	if (!stream.open()) {
		return false;
	}

	const std::size_t bufferSize = 1024;
	char *buffer = new char[bufferSize];
	std::string sixBytes; 
	int valuableBytesCounter = 0;
	bool skipFlag = true;
	while (valuableBytesCounter < 6) {
		std::size_t size = stream.read(buffer, bufferSize);
		if (size == 0) {
			break;
		}
		std::size_t index;
		for (index = 0; skipFlag && (index < size); ++index) {
			if (!std::isspace((unsigned char)buffer[index])) {
				skipFlag = false;
				break;
			}
		}
		if (!skipFlag && index < size) {
			int bytes = std::min(6 - valuableBytesCounter, (int)(size - index));
			sixBytes = std::string(buffer + index, bytes);
			valuableBytesCounter += bytes;
		}
	}
	stream.close();
	delete[] buffer;
	return ZLUnicodeUtil::toLower(sixBytes) == "<html>";
}

bool TextFormatDetector::isPPL(ZLInputStream &stream) const {
	if (!stream.open()) {
		return false;
	}

	char buffer[5]; 
	bool result = stream.read(buffer, 5) == 5 && std::strncmp(buffer, "PPL\r\n", 5) == 0;
	stream.close();
	return result;
}