You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
tdeedu/kiten/deinf.cpp

124 lines
3.1 KiB

/**
This file is part of Kiten, a KDE Japanese Reference Tool...
Copyright (C) 2001 Jason Katz-Brown <jason@katzbrown.com>
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301
USA
**/
#include <kdebug.h>
#include <kstandarddirs.h>
#include <tdemessagebox.h>
#include <tdelocale.h>
#include <tqfile.h>
#include <tqregexp.h>
#include <tqtextcodec.h>
#include "deinf.h"
Deinf::Index::Index()
{
loaded = false;
}
void Deinf::Index::load()
{
if (loaded)
return;
TDEStandardDirs *dirs = TDEGlobal::dirs();
TQString vconj = dirs->findResource("data", "kiten/vconj");
if (vconj.isNull())
{
KMessageBox::error(0, i18n("Verb deinflection information not found, so verb deinflection cannot be used."));
return;
}
TQFile f(vconj);
if (!f.open(IO_ReadOnly))
{
KMessageBox::error(0, i18n("Verb deinflection information could not be loaded, so verb deinflection cannot be used."));
return;
}
TQTextStream t(&f);
t.setCodec(TQTextCodec::codecForName("eucJP"));
for(TQString text = t.readLine(); !t.eof() && text.at(0) != '$'; text = t.readLine())
{
if(text.at(0) != '#')
{
unsigned int number = text.left(2).stripWhiteSpace().toUInt();
TQString name = text.right(text.length() - 2).stripWhiteSpace();
names[number] = name;
}
}
for(TQString text = t.readLine(); !text.isEmpty(); text = t.readLine())
{
if(text.at(0) != '#')
{
TQStringList things(TQStringList::split(TQChar('\t'), text));
Conjugation conj;
conj.ending = things.first();
conj.replace = (*things.at(1));
conj.num = things.last().toUInt();
list.append(conj);
}
}
f.close();
loaded = true;
}
namespace
{
TQStringList possibleConjugations(const TQString &text)
{
TQStringList endings;
for (unsigned i = 0; i < text.length(); ++i)
endings.append(text.right(i));
return endings;
}
}
TQStringList Deinf::Index::deinflect(const TQString &text, TQStringList &name)
{
load();
TQStringList endings = possibleConjugations(text);
TQStringList ret;
for (TQValueListIterator <Conjugation> it = list.begin(); it != list.end(); ++it)
{
TQStringList matches(endings.grep(TQRegExp(TQString("^") + (*it).ending)));
if (matches.size() > 0) // a match
{
name.append(names[(*it).num]);
//kdDebug() << "match ending: " << (*it).ending << "; replace: " << (*it).replace << "; name: " << names[(*it).num] << endl;
TQString tmp(text);
tmp.replace(TQRegExp((*it).ending + "*", false, true), (*it).replace);
ret.append(tmp);
}
}
return ret;
}