1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199
|
/*
This file is part of Kiten, a KDE Japanese Reference Tool
SPDX-FileCopyrightText: 2001 Jason Katz-Brown <jason@katzbrown.com>
SPDX-FileCopyrightText: 2006 Joseph Kerian <jkerian@gmail.com>
SPDX-FileCopyrightText: 2006 Eric Kjeldergaard <kjelderg@gmail.com>
SPDX-FileCopyrightText: 2011 Daniel E. Moctezuma <democtezuma@gmail.com>
SPDX-License-Identifier: LGPL-2.0-or-later
*/
#include "deinflection.h"
#include "dictfileedict.h"
#include "dictquery.h"
#include "entryedict.h"
#include "entrylist.h"
#include <KLocalizedString>
#include <KMessageBox>
#include <QFile>
#include <QHash>
#include <QList>
#include <QStandardPaths>
#include <QString>
#include <QStringDecoder>
#include <QTextStream>
using namespace Qt::StringLiterals;
// This is a very primative form of information hiding
// But C++ can get stupid with static QT objects...
// So this turns out to be much, much easier
// TODO: Fix this for thread safety/functionality (I'm presuming it's broken atm)
// Declare our constants
QList<Deinflection::Conjugation> *Deinflection::conjugationList = nullptr;
Deinflection::Deinflection(const QString &name)
: m_deinflectionLabel(QString())
, m_wordType(QString())
, m_dictionaryName(name)
{
}
QString *Deinflection::getDeinflectionLabel()
{
return &m_deinflectionLabel;
}
QString *Deinflection::getWordType()
{
return &m_wordType;
}
EntryList *Deinflection::search(const DictQuery &query, const QList<QString> &preliminaryResults)
{
if (conjugationList == nullptr) {
return nullptr;
}
m_deinflectionLabel = QString();
m_wordType = QString();
auto entries = new EntryList();
QStringList edictTypesList;
edictTypesList.append(EdictFormatting::Adjectives);
edictTypesList.append(EdictFormatting::Verbs);
QString edictTypes = edictTypesList.join(QLatin1Char(','));
for (const QString &item : preliminaryResults) {
EntryEdict *entry = makeEntry(item);
QStringListIterator it(entry->getTypesList());
bool matched = false;
while (it.hasNext() && !matched) {
if (edictTypes.contains(it.next())) {
entries->append(entry);
matched = true;
}
}
if (!matched)
delete entry;
}
auto results = new EntryList();
EntryList::EntryIterator it(*entries);
while (it.hasNext()) {
auto entry = static_cast<EntryEdict *>(it.next());
QString text = query.getWord();
if (text.isEmpty()) {
text = query.getPronunciation();
if (text.isEmpty()) {
entries->deleteAll();
delete entries;
delete results;
return nullptr;
}
}
QString word = entry->getWord();
for (const Deinflection::Conjugation &conj : *conjugationList) {
if (text.endsWith(conj.ending) && word.endsWith(conj.replace) && text.startsWith(word.left(word.length() - conj.replace.length()))) {
QString replacement = text;
replacement.truncate(text.length() - conj.ending.length());
replacement += conj.replace;
if (word == replacement) {
if (m_deinflectionLabel.isEmpty()) {
m_deinflectionLabel = conj.label;
}
if (m_wordType.isEmpty()) {
if (entry->isVerb()) {
m_wordType = i18n("verb");
} else if (entry->isAdjective()) {
m_wordType = i18n("adjective");
}
}
results->append(entry);
break;
}
}
}
}
delete entries;
return results;
}
bool Deinflection::load()
{
if (conjugationList != nullptr) {
return true;
}
conjugationList = new QList<Conjugation>;
QString vconj = QStandardPaths::locate(QStandardPaths::GenericDataLocation, QStringLiteral("kiten/vconj"));
// Find the file
if (vconj.isEmpty()) {
KMessageBox::error(nullptr, i18n("Verb deinflection information not found, so verb deinflection cannot be used."));
return false;
}
QHash<unsigned long, QString> names;
// Open the file
QFile f(vconj);
if (!f.open(QIODevice::ReadOnly)) {
KMessageBox::error(nullptr, i18n("Verb deinflection information could not be loaded, so verb deinflection cannot be used."));
return false;
}
QStringDecoder decoder("EUC-JP");
const QString decoded = decoder(f.readAll());
QTextStream t(decoded.toUtf8());
// The file starts out with a number -> name list of the conjugation types
// In the format "#[#] NAME\n"
// The next section beginning is flagged with a $ at the beginning of the line
for (QString text = t.readLine(); !t.atEnd() && text.at(0) != '$'_L1; text = t.readLine()) {
if (text.at(0) != '#'_L1) {
unsigned long number = text.left(2).trimmed().toULong();
QString name = text.right(text.length() - 2).trimmed();
names[number] = name;
}
}
// Now for the actual conjugation data
// Format is "NUMBER_FROM_LIST_ABOVE ENDING_TO_REPLACE\n"
QString replacement = QString();
for (QString text = t.readLine(); !t.atEnd(); text = t.readLine()) {
if (!text.isEmpty() && text.at(0) == '$'_L1) {
replacement = text.right(1).trimmed();
} else if (!text.trimmed().isEmpty() && text.at(0) != '#'_L1) {
unsigned long labelIndex = text.section(' '_L1, 0, 1).trimmed().toULong();
Conjugation conj;
conj.label = names.value(labelIndex);
conj.ending = text.section(' '_L1, 2).trimmed();
conj.replace = replacement;
conjugationList->append(conj);
}
}
f.close();
return true;
}
inline EntryEdict *Deinflection::makeEntry(const QString &entry)
{
return new EntryEdict(m_dictionaryName, entry);
}
|