1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
|
/**
This file is part of Kiten, a KDE Japanese Reference Tool...
Copyright (C) 2001 Jason Katz-Brown <[email protected]>
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301
USA
**/
#include <kdebug.h>
#include <kstandarddirs.h>
#include <tdemessagebox.h>
#include <tdelocale.h>
#include <tqfile.h>
#include <tqregexp.h>
#include <tqtextcodec.h>
#include "deinf.h"
/**
 * Creates an index with no deinflection data in memory yet.
 *
 * Only the `loaded` flag is initialised here (to false); the data file
 * itself is read by load().
 */
Deinf::Index::Index()
	: loaded(false)
{
}
void Deinf::Index::load()
{
if (loaded)
return;
TDEStandardDirs *dirs = TDEGlobal::dirs();
TQString vconj = dirs->findResource("data", "kiten/vconj");
if (vconj.isNull())
{
KMessageBox::error(0, i18n("Verb deinflection information not found, so verb deinflection cannot be used."));
return;
}
TQFile f(vconj);
if (!f.open(IO_ReadOnly))
{
KMessageBox::error(0, i18n("Verb deinflection information could not be loaded, so verb deinflection cannot be used."));
return;
}
TQTextStream t(&f);
t.setCodec(TQTextCodec::codecForName("eucJP"));
for(TQString text = t.readLine(); !t.eof() && text.at(0) != '$'; text = t.readLine())
{
if(text.at(0) != '#')
{
unsigned int number = text.left(2).stripWhiteSpace().toUInt();
TQString name = text.right(text.length() - 2).stripWhiteSpace();
names[number] = name;
}
}
for(TQString text = t.readLine(); !text.isEmpty(); text = t.readLine())
{
if(text.at(0) != '#')
{
TQStringList things(TQStringList::split(TQChar('\t'), text));
Conjugation conj;
conj.ending = things.first();
conj.replace = (*things.at(1));
conj.num = things.last().toUInt();
list.append(conj);
}
}
f.close();
loaded = true;
}
namespace
{
	/**
	 * Builds the list of trailing substrings of @p text, shortest first.
	 *
	 * One entry is produced for every length from 0 up to, but not
	 * including, the length of @p text. The first entry is therefore the
	 * zero-length tail and the complete string itself is never part of
	 * the result. An empty @p text gives an empty list.
	 */
	TQStringList possibleConjugations(const TQString &text)
	{
		const unsigned total = text.length();
		TQStringList tails;

		unsigned take = 0;
		while (take < total)
		{
			tails.append(text.right(take));
			++take;
		}

		return tails;
	}
}
/**
 * Produces candidate base forms of @p text from the loaded conjugation
 * table.
 *
 * load() is called first. Every conjugation in `list` is then tried in
 * order: it applies when at least one entry of possibleConjugations(text)
 * matches the regular expression "^" + ending. For each conjugation that
 * applies:
 *  - names[num] is appended to @p name, and
 *  - a copy of @p text, in which every match of the case-insensitive
 *    wildcard pattern ending + "*" is replaced by the conjugation's
 *    replacement, is appended to the result.
 *
 * @param text  the word to deinflect
 * @param name  receives one conjugation name per returned candidate, in
 *              the same order; existing entries are kept
 * @return the candidate strings; empty when no conjugation applies
 */
TQStringList Deinf::Index::deinflect(const TQString &text, TQStringList &name)
{
	load();

	const TQStringList tails = possibleConjugations(text);
	TQStringList candidates;

	for (TQValueListIterator <Conjugation> rule = list.begin(); rule != list.end(); ++rule)
	{
		// Does any trailing substring of the word begin with this ending?
		const TQRegExp tailStart(TQString("^") + (*rule).ending);
		if (tails.grep(tailStart).isEmpty())
			continue;

		name.append(names[(*rule).num]);

		// Wildcard pattern: the ending plus whatever follows it.
		const TQRegExp fromEnding((*rule).ending + "*", false, true);
		TQString rewritten(text);
		rewritten.replace(fromEnding, (*rule).replace);
		candidates.append(rewritten);
	}

	return candidates;
}
|