| 1 | /**************************************************************************** | 
|---|
| 2 | ** | 
|---|
| 3 | ** Copyright (C) 2011 Nokia Corporation and/or its subsidiary(-ies). | 
|---|
| 4 | ** All rights reserved. | 
|---|
| 5 | ** Contact: Nokia Corporation (qt-info@nokia.com) | 
|---|
| 6 | ** | 
|---|
| 7 | ** This file is part of the Qt Linguist of the Qt Toolkit. | 
|---|
| 8 | ** | 
|---|
| 9 | ** $QT_BEGIN_LICENSE:LGPL$ | 
|---|
| 10 | ** Commercial Usage | 
|---|
| 11 | ** Licensees holding valid Qt Commercial licenses may use this file in | 
|---|
| 12 | ** accordance with the Qt Commercial License Agreement provided with the | 
|---|
| 13 | ** Software or, alternatively, in accordance with the terms contained in | 
|---|
| 14 | ** a written agreement between you and Nokia. | 
|---|
| 15 | ** | 
|---|
| 16 | ** GNU Lesser General Public License Usage | 
|---|
| 17 | ** Alternatively, this file may be used under the terms of the GNU Lesser | 
|---|
| 18 | ** General Public License version 2.1 as published by the Free Software | 
|---|
| 19 | ** Foundation and appearing in the file LICENSE.LGPL included in the | 
|---|
| 20 | ** packaging of this file.  Please review the following information to | 
|---|
| 21 | ** ensure the GNU Lesser General Public License version 2.1 requirements | 
|---|
| 22 | ** will be met: http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html. | 
|---|
| 23 | ** | 
|---|
| 24 | ** In addition, as a special exception, Nokia gives you certain additional | 
|---|
| 25 | ** rights.  These rights are described in the Nokia Qt LGPL Exception | 
|---|
| 26 | ** version 1.1, included in the file LGPL_EXCEPTION.txt in this package. | 
|---|
| 27 | ** | 
|---|
| 28 | ** GNU General Public License Usage | 
|---|
| 29 | ** Alternatively, this file may be used under the terms of the GNU | 
|---|
| 30 | ** General Public License version 3.0 as published by the Free Software | 
|---|
| 31 | ** Foundation and appearing in the file LICENSE.GPL included in the | 
|---|
| 32 | ** packaging of this file.  Please review the following information to | 
|---|
| 33 | ** ensure the GNU General Public License version 3.0 requirements will be | 
|---|
| 34 | ** met: http://www.gnu.org/copyleft/gpl.html. | 
|---|
| 35 | ** | 
|---|
| 36 | ** If you have questions regarding the use of this file, please contact | 
|---|
| 37 | ** Nokia at qt-info@nokia.com. | 
|---|
| 38 | ** $QT_END_LICENSE$ | 
|---|
| 39 | ** | 
|---|
| 40 | ****************************************************************************/ | 
|---|
| 41 |  | 
|---|
| 42 | #include "lupdate.h" | 
|---|
| 43 |  | 
|---|
| 44 | #include "simtexth.h" | 
|---|
| 45 | #include "translator.h" | 
|---|
| 46 |  | 
|---|
| 47 | #include <QtCore/QCoreApplication> | 
|---|
| 48 | #include <QtCore/QDebug> | 
|---|
| 49 | #include <QtCore/QMap> | 
|---|
| 50 | #include <QtCore/QStringList> | 
|---|
| 51 | #include <QtCore/QTextCodec> | 
|---|
| 52 | #include <QtCore/QVector> | 
|---|
| 53 |  | 
|---|
| 54 | QT_BEGIN_NAMESPACE | 
|---|
| 55 |  | 
|---|
/*
    Translation helper class. Q_DECLARE_TR_FUNCTIONS equips it with the
    tr() function that merge() calls as LU::tr() when it builds its
    verbose report; the macro argument, LUpdate, names the translation
    context used for those strings.
*/
class LU {
    Q_DECLARE_TR_FUNCTIONS(LUpdate)
};
|---|
| 59 |  | 
|---|
| 60 | static bool isDigitFriendly(QChar c) | 
|---|
| 61 | { | 
|---|
| 62 | return c.isPunct() || c.isSpace(); | 
|---|
| 63 | } | 
|---|
| 64 |  | 
|---|
| 65 | static int numberLength(const QString &s, int i) | 
|---|
| 66 | { | 
|---|
| 67 | if (i >= s.size() || !s.at(i).isDigit()) | 
|---|
| 68 | return 0; | 
|---|
| 69 |  | 
|---|
| 70 | int pos = i; | 
|---|
| 71 | do { | 
|---|
| 72 | ++i; | 
|---|
| 73 | } while (i < s.size() | 
|---|
| 74 | && (s.at(i).isDigit() | 
|---|
| 75 | || (isDigitFriendly(s[i]) | 
|---|
| 76 | && i + 1 < s.size() | 
|---|
| 77 | && (s[i + 1].isDigit() | 
|---|
| 78 | || (isDigitFriendly(s[i + 1]) | 
|---|
| 79 | && i + 2 < s.size() | 
|---|
| 80 | && s[i + 2].isDigit()))))); | 
|---|
| 81 | return i - pos; | 
|---|
| 82 | } | 
|---|
| 83 |  | 
|---|
| 84 |  | 
|---|
| 85 | /* | 
|---|
| 86 | Returns a version of 'key' where all numbers have been replaced by zeroes.  If | 
|---|
| 87 | there were none, returns "". | 
|---|
| 88 | */ | 
|---|
| 89 | static QString zeroKey(const QString &key) | 
|---|
| 90 | { | 
|---|
| 91 | QString zeroed; | 
|---|
| 92 | bool metSomething = false; | 
|---|
| 93 |  | 
|---|
| 94 | for (int i = 0; i < key.size(); ++i) { | 
|---|
| 95 | int len = numberLength(key, i); | 
|---|
| 96 | if (len > 0) { | 
|---|
| 97 | i += len; | 
|---|
| 98 | zeroed.append(QLatin1Char('0')); | 
|---|
| 99 | metSomething = true; | 
|---|
| 100 | } else { | 
|---|
| 101 | zeroed.append(key.at(i)); | 
|---|
| 102 | } | 
|---|
| 103 | } | 
|---|
| 104 | return metSomething ? zeroed : QString(); | 
|---|
| 105 | } | 
|---|
| 106 |  | 
|---|
| 107 | static QString translationAttempt(const QString &oldTranslation, | 
|---|
| 108 | const QString &oldSource, const QString &newSource) | 
|---|
| 109 | { | 
|---|
| 110 | int p = zeroKey(oldSource).count(QLatin1Char('0')); | 
|---|
| 111 | QString attempt; | 
|---|
| 112 | QStringList oldNumbers; | 
|---|
| 113 | QStringList newNumbers; | 
|---|
| 114 | QVector<bool> met(p); | 
|---|
| 115 | QVector<int> matchedYet(p); | 
|---|
| 116 | int i, j; | 
|---|
| 117 | int k = 0, ell, best; | 
|---|
| 118 | int m, n; | 
|---|
| 119 | int pass; | 
|---|
| 120 |  | 
|---|
| 121 | /* | 
|---|
| 122 | This algorithm is hard to follow, so we'll consider an example | 
|---|
| 123 | all along: oldTranslation is "XeT 3.0", oldSource is "TeX 3.0" | 
|---|
| 124 | and newSource is "XeT 3.1". | 
|---|
| 125 |  | 
|---|
| 126 | First, we set up two tables: oldNumbers and newNumbers. In our | 
|---|
| 127 | example, oldNumber[0] is "3.0" and newNumber[0] is "3.1". | 
|---|
| 128 | */ | 
|---|
| 129 | for (i = 0, j = 0; i < oldSource.size(); i++, j++) { | 
|---|
| 130 | m = numberLength(oldSource, i); | 
|---|
| 131 | n = numberLength(newSource, j); | 
|---|
| 132 | if (m > 0) { | 
|---|
| 133 | oldNumbers.append(oldSource.mid(i, m + 1)); | 
|---|
| 134 | newNumbers.append(newSource.mid(j, n + 1)); | 
|---|
| 135 | i += m; | 
|---|
| 136 | j += n; | 
|---|
| 137 | met[k] = false; | 
|---|
| 138 | matchedYet[k] = 0; | 
|---|
| 139 | k++; | 
|---|
| 140 | } | 
|---|
| 141 | } | 
|---|
| 142 |  | 
|---|
| 143 | /* | 
|---|
| 144 | We now go over the old translation, "XeT 3.0", one letter at a | 
|---|
| 145 | time, looking for numbers found in oldNumbers. Whenever such a | 
|---|
| 146 | number is met, it is replaced with its newNumber equivalent. In | 
|---|
| 147 | our example, the "3.0" of "XeT 3.0" becomes "3.1". | 
|---|
| 148 | */ | 
|---|
| 149 | for (i = 0; i < oldTranslation.length(); i++) { | 
|---|
| 150 | attempt += oldTranslation[i]; | 
|---|
| 151 | for (k = 0; k < p; k++) { | 
|---|
| 152 | if (oldTranslation[i] == oldNumbers[k][matchedYet[k]]) | 
|---|
| 153 | matchedYet[k]++; | 
|---|
| 154 | else | 
|---|
| 155 | matchedYet[k] = 0; | 
|---|
| 156 | } | 
|---|
| 157 |  | 
|---|
| 158 | /* | 
|---|
| 159 | Let's find out if the last character ended a match. We make | 
|---|
| 160 | two passes over the data. In the first pass, we try to | 
|---|
| 161 | match only numbers that weren't matched yet; if that fails, | 
|---|
| 162 | the second pass does the trick. This is useful in some | 
|---|
| 163 | suspicious cases, flagged below. | 
|---|
| 164 | */ | 
|---|
| 165 | for (pass = 0; pass < 2; pass++) { | 
|---|
| 166 | best = p; // an impossible value | 
|---|
| 167 | for (k = 0; k < p; k++) { | 
|---|
| 168 | if ((!met[k] || pass > 0) && | 
|---|
| 169 | matchedYet[k] == oldNumbers[k].length() && | 
|---|
| 170 | numberLength(oldTranslation, i + 1 - matchedYet[k]) == matchedYet[k]) { | 
|---|
| 171 | // the longer the better | 
|---|
| 172 | if (best == p || matchedYet[k] > matchedYet[best]) | 
|---|
| 173 | best = k; | 
|---|
| 174 | } | 
|---|
| 175 | } | 
|---|
| 176 | if (best != p) { | 
|---|
| 177 | attempt.truncate(attempt.length() - matchedYet[best]); | 
|---|
| 178 | attempt += newNumbers[best]; | 
|---|
| 179 | met[best] = true; | 
|---|
| 180 | for (k = 0; k < p; k++) | 
|---|
| 181 | matchedYet[k] = 0; | 
|---|
| 182 | break; | 
|---|
| 183 | } | 
|---|
| 184 | } | 
|---|
| 185 | } | 
|---|
| 186 |  | 
|---|
| 187 | /* | 
|---|
| 188 | We flag two kinds of suspicious cases. They are identified as | 
|---|
| 189 | such with comments such as "{2000?}" at the end. | 
|---|
| 190 |  | 
|---|
| 191 | Example of the first kind: old source text "TeX 3.0" translated | 
|---|
| 192 | as "XeT 2.0" is flagged "TeX 2.0 {3.0?}", no matter what the | 
|---|
| 193 | new text is. | 
|---|
| 194 | */ | 
|---|
| 195 | for (k = 0; k < p; k++) { | 
|---|
| 196 | if (!met[k]) | 
|---|
| 197 | attempt += QLatin1String(" {") + newNumbers[k] + QLatin1String("?}"); | 
|---|
| 198 | } | 
|---|
| 199 |  | 
|---|
| 200 | /* | 
|---|
| 201 | Example of the second kind: "1 of 1" translated as "1 af 1", | 
|---|
| 202 | with new source text "1 of 2", generates "1 af 2 {1 or 2?}" | 
|---|
| 203 | because it's not clear which of "1 af 2" and "2 af 1" is right. | 
|---|
| 204 | */ | 
|---|
| 205 | for (k = 0; k < p; k++) { | 
|---|
| 206 | for (ell = 0; ell < p; ell++) { | 
|---|
| 207 | if (k != ell && oldNumbers[k] == oldNumbers[ell] && | 
|---|
| 208 | newNumbers[k] < newNumbers[ell]) | 
|---|
| 209 | attempt += QLatin1String(" {") + newNumbers[k] + QLatin1String(" or ") + | 
|---|
| 210 | newNumbers[ell] + QLatin1String("?}"); | 
|---|
| 211 | } | 
|---|
| 212 | } | 
|---|
| 213 | return attempt; | 
|---|
| 214 | } | 
|---|
| 215 |  | 
|---|
| 216 |  | 
|---|
| 217 | /* | 
|---|
| 218 | Augments a Translator with translations easily derived from | 
|---|
| 219 | similar existing (probably obsolete) translations. | 
|---|
| 220 |  | 
|---|
| 221 | For example, if "TeX 3.0" is translated as "XeT 3.0" and "TeX 3.1" | 
|---|
| 222 | has no translation, "XeT 3.1" is added to the translator and is | 
|---|
| 223 | marked Unfinished. | 
|---|
| 224 |  | 
|---|
| 225 | Returns the number of additional messages that this heuristic translated. | 
|---|
| 226 | */ | 
|---|
| 227 | int applyNumberHeuristic(Translator &tor) | 
|---|
| 228 | { | 
|---|
| 229 | QMap<QString, QPair<QString, QString> > translated; | 
|---|
| 230 | QVector<bool> untranslated(tor.messageCount()); | 
|---|
| 231 | int inserted = 0; | 
|---|
| 232 |  | 
|---|
| 233 | for (int i = 0; i < tor.messageCount(); ++i) { | 
|---|
| 234 | const TranslatorMessage &msg = tor.message(i); | 
|---|
| 235 | bool hasTranslation = msg.isTranslated(); | 
|---|
| 236 | if (msg.type() == TranslatorMessage::Unfinished) { | 
|---|
| 237 | if (!hasTranslation) | 
|---|
| 238 | untranslated[i] = true; | 
|---|
| 239 | } else if (hasTranslation && msg.translations().count() == 1) { | 
|---|
| 240 | const QString &key = zeroKey(msg.sourceText()); | 
|---|
| 241 | if (!key.isEmpty()) | 
|---|
| 242 | translated.insert(key, qMakePair(msg.sourceText(), msg.translation())); | 
|---|
| 243 | } | 
|---|
| 244 | } | 
|---|
| 245 |  | 
|---|
| 246 | for (int i = 0; i < tor.messageCount(); ++i) { | 
|---|
| 247 | if (untranslated[i]) { | 
|---|
| 248 | TranslatorMessage &msg = tor.message(i); | 
|---|
| 249 | const QString &key = zeroKey(msg.sourceText()); | 
|---|
| 250 | if (!key.isEmpty()) { | 
|---|
| 251 | QMap<QString, QPair<QString, QString> >::ConstIterator t = | 
|---|
| 252 | translated.constFind(key); | 
|---|
| 253 | if (t != translated.constEnd() && t->first != msg.sourceText()) { | 
|---|
| 254 | msg.setTranslation(translationAttempt(t->second, t->first, | 
|---|
| 255 | msg.sourceText())); | 
|---|
| 256 | inserted++; | 
|---|
| 257 | } | 
|---|
| 258 | } | 
|---|
| 259 | } | 
|---|
| 260 | } | 
|---|
| 261 | return inserted; | 
|---|
| 262 | } | 
|---|
| 263 |  | 
|---|
| 264 |  | 
|---|
| 265 | /* | 
|---|
| 266 | Augments a Translator with trivially derived translations. | 
|---|
| 267 |  | 
|---|
| 268 | For example, if "Enabled:" is consistendly translated as "Eingeschaltet:" no | 
|---|
| 269 | matter the context or the comment, "Eingeschaltet:" is added as the | 
|---|
| 270 | translation of any untranslated "Enabled:" text and is marked Unfinished. | 
|---|
| 271 |  | 
|---|
| 272 | Returns the number of additional messages that this heuristic translated. | 
|---|
| 273 | */ | 
|---|
| 274 |  | 
|---|
| 275 | int applySameTextHeuristic(Translator &tor) | 
|---|
| 276 | { | 
|---|
| 277 | QMap<QString, QStringList> translated; | 
|---|
| 278 | QMap<QString, bool> avoid; // Want a QTreeSet, in fact | 
|---|
| 279 | QVector<bool> untranslated(tor.messageCount()); | 
|---|
| 280 | int inserted = 0; | 
|---|
| 281 |  | 
|---|
| 282 | for (int i = 0; i < tor.messageCount(); ++i) { | 
|---|
| 283 | const TranslatorMessage &msg = tor.message(i); | 
|---|
| 284 | if (!msg.isTranslated()) { | 
|---|
| 285 | if (msg.type() == TranslatorMessage::Unfinished) | 
|---|
| 286 | untranslated[i] = true; | 
|---|
| 287 | } else { | 
|---|
| 288 | const QString &key = msg.sourceText(); | 
|---|
| 289 | QMap<QString, QStringList>::ConstIterator t = translated.constFind(key); | 
|---|
| 290 | if (t != translated.constEnd()) { | 
|---|
| 291 | /* | 
|---|
| 292 | The same source text is translated at least two | 
|---|
| 293 | different ways. Do nothing then. | 
|---|
| 294 | */ | 
|---|
| 295 | if (*t != msg.translations()) { | 
|---|
| 296 | translated.remove(key); | 
|---|
| 297 | avoid.insert(key, true); | 
|---|
| 298 | } | 
|---|
| 299 | } else if (!avoid.contains(key)) { | 
|---|
| 300 | translated.insert(key, msg.translations()); | 
|---|
| 301 | } | 
|---|
| 302 | } | 
|---|
| 303 | } | 
|---|
| 304 |  | 
|---|
| 305 | for (int i = 0; i < tor.messageCount(); ++i) { | 
|---|
| 306 | if (untranslated[i]) { | 
|---|
| 307 | TranslatorMessage &msg = tor.message(i); | 
|---|
| 308 | QMap<QString, QStringList>::ConstIterator t = translated.constFind(msg.sourceText()); | 
|---|
| 309 | if (t != translated.constEnd()) { | 
|---|
| 310 | msg.setTranslations(*t); | 
|---|
| 311 | ++inserted; | 
|---|
| 312 | } | 
|---|
| 313 | } | 
|---|
| 314 | } | 
|---|
| 315 | return inserted; | 
|---|
| 316 | } | 
|---|
| 317 |  | 
|---|
| 318 |  | 
|---|
| 319 |  | 
|---|
/*
  Merges two Translator objects and returns the result.

  'tor' (the "vernacular" translator) is a set of source texts and
  translations for a previous version of the internationalized program;
  'virginTor' is a set of fresh source texts newly extracted from the
  source code, without any translation yet.

  'options' selects the heuristics to apply (HeuristicSimilarText,
  HeuristicSameText, HeuristicNumber), how new messages are appended
  (NoLocations) and whether a report is produced (Verbose; NoObsolete
  only changes the wording of that report here). The report, if any, is
  appended to 'err'.
*/

Translator merge(const Translator &tor, const Translator &virginTor,
    UpdateOptions options, QString &err)
{
    // Statistics for the verbose report.
    int known = 0;                      // messages present in both translators
    int neww = 0;                       // messages counted as new
    int obsoleted = 0;                  // messages that became obsolete in this run
    int similarTextHeuristicCount = 0;  // messages matched by the similar-text heuristic

    // The result inherits its language and format settings from the
    // vernacular translator.
    Translator outTor;
    outTor.setLanguageCode(tor.languageCode());
    outTor.setSourceLanguageCode(tor.sourceLanguageCode());
    outTor.setLocationsType(tor.locationsType());
    outTor.setCodecName(tor.codecName());

    /*
        The types of all the messages from the vernacular translator
        are updated according to the virgin translator.
    */
    // m is a copy on purpose: it is modified and then appended to outTor.
    foreach (TranslatorMessage m, tor.messages()) {
        TranslatorMessage::Type newType = TranslatorMessage::Finished;

        if (m.sourceText().isEmpty() && m.id().isEmpty()) {
            // context/file comment: take over the comment from the virgin
            // translator if that context still exists there
            TranslatorMessage mv = virginTor.find(m.context());
            if (!mv.isNull())
                m.setComment(mv.comment());
        } else {
            TranslatorMessage mv;
            // Index of the matching message in the virgin translator,
            // negative if there is none.
            int mvi = virginTor.find(m);
            if (mvi < 0) {
                if (!(options & HeuristicSimilarText)) {
                  // Also reached by goto from the similar-text branch below.
                  makeObsolete:
                    newType = TranslatorMessage::Obsolete;
                    // Count only messages that were not obsolete before.
                    if (m.type() != TranslatorMessage::Obsolete)
                        obsoleted++;
                    m.clearReferences();
                } else {
                    // Look for a virgin message with the same context,
                    // comment and references.
                    mv = virginTor.find(m.context(), m.comment(), m.allReferences());
                    if (mv.isNull()) {
                        // did not find it in the virgin, mark it as obsolete
                        goto makeObsolete;
                    } else {
                        // Do not just accept it if it is on the same line number
                        // but has a different source text.
                        // Also check if the texts are more or less similar before
                        // we consider them to represent the same message...
                        if (getSimilarityScore(m.sourceText(), mv.sourceText()) >= textSimilarityThreshold) {
                            // It is just slightly modified, assume that it is the same string

                            // Mark it as unfinished. (Since the source text
                            // was changed it might require re-translating...)
                            newType = TranslatorMessage::Unfinished;
                            ++similarTextHeuristicCount;
                            neww++;

                          // Also reached by goto from the id-based match below.
                          // Keeps the previous source text (and the previous plural
                          // source stored in the "po-msgid_plural" extra, if any)
                          // as "old" data and switches to the virgin source text.
                          outdateSource:
                            m.setOldSourceText(m.sourceText());
                            m.setSourceText(mv.sourceText());
                            const QString &oldpluralsource = m.extra(QLatin1String("po-msgid_plural"));
                            if (!oldpluralsource.isEmpty()) {
                                m.setExtra(QLatin1String("po-old_msgid_plural"), oldpluralsource);
                                m.unsetExtra(QLatin1String("po-msgid_plural"));
                            }
                            goto copyAttribs; // Update secondary references
                        } else {
                            // The virgin and vernacular sourceTexts are so
                            // different that we could not find it.
                            goto makeObsolete;
                        }
                    }
                }
            } else {
                mv = virginTor.message(mvi);
                if (!mv.id().isEmpty()
                    && (mv.context() != m.context()
                        || mv.sourceText() != m.sourceText()
                        || mv.comment() != m.comment())) {
                    // The virgin message has an id, but its context, source
                    // text or comment changed: keep the translation, mark it
                    // unfinished and take over the new context and comment.
                    known++;
                    newType = TranslatorMessage::Unfinished;
                    m.setContext(mv.context());
                    m.setComment(mv.comment());
                    if (mv.sourceText() != m.sourceText())
                        goto outdateSource;
                } else {
                    // Same message: the new type depends on the old one.
                    switch (m.type()) {
                    case TranslatorMessage::Finished:
                    default:
                        // A change in plural-ness requires a new translation.
                        if (m.isPlural() == mv.isPlural()) {
                            newType = TranslatorMessage::Finished;
                        } else {
                            newType = TranslatorMessage::Unfinished;
                        }
                        known++;
                        break;
                    case TranslatorMessage::Unfinished:
                        newType = TranslatorMessage::Unfinished;
                        known++;
                        break;
                    case TranslatorMessage::Obsolete:
                        // An obsolete message that is in use again is
                        // counted as new and must be reviewed.
                        newType = TranslatorMessage::Unfinished;
                        neww++;
                    }
                }

                // Always get the filename and linenumber info from the
                // virgin Translator, in case it has changed location.
                // This should also enable us to read a file that does not
                // have the <location> element.
                // why not use operator=()? Because it overwrites e.g. userData.
              copyAttribs:
                m.setReferences(mv.allReferences());
                m.setPlural(mv.isPlural());
                m.setUtf8(mv.isUtf8());
                m.setExtraComment(mv.extraComment());
                m.setId(mv.id());
            }
        }

        m.setType(newType);
        outTor.append(m);
    }

    /*
        Messages found only in the virgin translator are added to the
        vernacular translator.
    */
    foreach (const TranslatorMessage &mv, virginTor.messages()) {
        if (mv.sourceText().isEmpty() && mv.id().isEmpty()) {
            // context/file comment: skip it if the context is already known
            if (tor.contains(mv.context()))
                continue;
        } else {
            // Already handled by the first loop.
            if (tor.find(mv) >= 0)
                continue;
            if (options & HeuristicSimilarText) {
                // Skip messages that the first loop matched through the
                // similar-text heuristic (same lookup and same threshold).
                TranslatorMessage m = tor.find(mv.context(), mv.comment(), mv.allReferences());
                if (!m.isNull()) {
                    if (getSimilarityScore(m.sourceText(), mv.sourceText()) >= textSimilarityThreshold)
                        continue;
                }
            }
        }
        if (options & NoLocations)
            outTor.append(mv);
        else
            outTor.appendSorted(mv);
        // Context/file comments are not counted as new source texts.
        if (!mv.sourceText().isEmpty() || !mv.id().isEmpty())
            ++neww;
    }

    /*
        The same-text heuristic handles cases where a message has an
        obsolete counterpart with a different context or comment.
    */
    int sameTextHeuristicCount = (options & HeuristicSameText) ? applySameTextHeuristic(outTor) : 0;

    /*
        The number heuristic handles cases where a message has an
        obsolete counterpart with mostly numbers differing in the
        source text.
    */
    int sameNumberHeuristicCount = (options & HeuristicNumber) ? applyNumberHeuristic(outTor) : 0;

    // The report is appended to err; nothing is printed here.
    if (options & Verbose) {
        int totalFound = neww + known;
        err += LU::tr("    Found %n source text(s) (%1 new and %2 already existing)\n", 0, totalFound).arg(neww).arg(known);

        if (obsoleted) {
            // Only the wording depends on NoObsolete: this function does not
            // remove the obsolete entries from outTor itself.
            if (options & NoObsolete) {
                err += LU::tr("    Removed %n obsolete entries\n", 0, obsoleted);
            } else {
                err += LU::tr("    Kept %n obsolete entries\n", 0, obsoleted);
            }
        }

        if (sameNumberHeuristicCount)
            err += LU::tr("    Number heuristic provided %n translation(s)\n",
                      0, sameNumberHeuristicCount);
        if (sameTextHeuristicCount)
            err += LU::tr("    Same-text heuristic provided %n translation(s)\n",
                      0, sameTextHeuristicCount);
        if (similarTextHeuristicCount)
            err += LU::tr("    Similar-text heuristic provided %n translation(s)\n",
                      0, similarTextHeuristicCount);
    }
    return outTor;
}
|---|
| 514 |  | 
|---|
| 515 | QT_END_NAMESPACE | 
|---|