Sonnet

guesslanguage.cpp
1/* This file is part of the KDE libraries
2 SPDX-FileCopyrightText: 2006 Jacob R Rideout <kde@jacobrideout.net>
3 SPDX-FileCopyrightText: 2009 Jakub Stachowski <qbast@go2.pl>
4 SPDX-FileCopyrightText: 2013 Martin Sandsmark <martin.sandsmark@kde.org>
5
6 SPDX-License-Identifier: LGPL-2.0-or-later
7*/
8
9#include <QCoreApplication>
10#include <QDataStream>
11#include <QFile>
12#include <QLocale>
13#include <QStandardPaths>
14
15#include "core_debug.h"
16#include "guesslanguage.h"
17#include "loader_p.h"
18#include "speller.h"
19#include "spellerplugin_p.h"
20#include "tokenizer_p.h"
21
22/*
23All language tags should be valid according to IETF BCP 47, as codified in RFC 4646.
24ISO 639-1 codes should be used for the language part except for cases where there
25exists no code, then 639-3 codes should be used. Country codes should only be used
26in special cases. Scripts can be differentiated by IANA subtags, available here:
27http://www.iana.org/assignments/language-subtag-registry
28The script tags correspond to ISO 15924
29
30An overview of the best practices concerning language tagging is available here:
31http://www.w3.org/International/articles/language-tags/Overview.en.php
32
33lang tags should use underscores (_) rather than hyphens (-) to separate subsections.
34
35EXCEPTIONS:
36For cases of known differences from the above tagging scheme and major
37spellcheckers such aspell/hunspell/myspell, the scheme used by the spell checkers
38shall be used. All exception shall be noted here:
39
40BCP SPELLCHECK
41az-Latn az
42
43*/
44
45namespace Sonnet
46{
47class GuessLanguagePrivate
48{
49public:
50 GuessLanguagePrivate();
51 // language trigram score
52 static QHash<QString, QHash<QString, int>> s_knownModels;
53
54 void loadModels();
55 QList<QChar::Script> findRuns(const QString &text);
56 QList<QString> createOrderedModel(const QString &content);
57 int distance(const QList<QString> &model, const QHash<QString, int> &knownModel);
58 QStringList guessFromTrigrams(const QString &sample, const QStringList &langs);
59 QStringList identify(const QString &sample, const QList<QChar::Script> &scripts);
60 QString guessFromDictionaries(const QString &sentence, const QStringList &candidates);
61
62 static QSet<QString> s_knownDictionaries;
63 static QMultiHash<QChar::Script, QString> s_scriptLanguages;
64 static QMap<QString, QString> s_dictionaryNameMap;
65
66 const int MIN_LENGTH;
67 int m_maxItems;
68 double m_minConfidence;
69};
70
71QHash<QString, QHash<QString, int>> GuessLanguagePrivate::s_knownModels;
72QSet<QString> GuessLanguagePrivate::s_knownDictionaries;
73QMultiHash<QChar::Script, QString> GuessLanguagePrivate::s_scriptLanguages;
74QMap<QString, QString> GuessLanguagePrivate::s_dictionaryNameMap;
75
76QStringList getNames(QLocale::Script script)
77{
78 QStringList locales;
79 const auto matchingLocales = QLocale::matchingLocales(QLocale::AnyLanguage, script, QLocale::AnyCountry);
80 locales.reserve(matchingLocales.size());
81 for (const QLocale &locale : matchingLocales) {
82 locales << locale.name();
83 }
84 return locales;
85}
86
87GuessLanguagePrivate::GuessLanguagePrivate()
88 : MIN_LENGTH(5)
89 , m_maxItems(1)
90 , m_minConfidence(0)
91{
92 if (!s_scriptLanguages.isEmpty()) {
93 return;
94 }
95
96 const QStringList languages = Loader::openLoader()->languages();
97 s_knownDictionaries = QSet<QString>(languages.begin(), languages.end());
98 QSet<QString> dictionaryLanguages;
99 for (const QString &dictName : std::as_const(s_knownDictionaries)) {
100 QString languageName = QLocale(dictName).name();
101 if (languageName.isEmpty()) {
102 qCWarning(SONNET_LOG_CORE) << "Unable to parse name for dictionary" << dictName;
103 continue;
104 }
105 dictionaryLanguages.insert(languageName);
106 }
107
108 QSet<QString> allLanguages;
109 for (int i = 0; i < int(QChar::ScriptCount); i++) {
110 QChar::Script script = static_cast<QChar::Script>(i);
111 QStringList names;
112 switch (script) {
114 names = getNames(QLocale::LatinScript);
115 break;
117 names = getNames(QLocale::GreekScript);
118 break;
120 names = getNames(QLocale::CyrillicScript);
121 break;
123 names = getNames(QLocale::ArmenianScript);
124 break;
126 names = getNames(QLocale::HebrewScript);
127 break;
129 names = getNames(QLocale::ArabicScript);
130 break;
132 names = getNames(QLocale::SyriacScript);
133 break;
135 names = getNames(QLocale::ThaanaScript);
136 break;
138 names = getNames(QLocale::DevanagariScript);
139 break;
141 names = getNames(QLocale::BengaliScript);
142 break;
144 names = getNames(QLocale::GurmukhiScript);
145 break;
147 names = getNames(QLocale::GujaratiScript);
148 break;
150 names = getNames(QLocale::OriyaScript);
151 break;
153 names = getNames(QLocale::TamilScript);
154 break;
156 names = getNames(QLocale::TeluguScript);
157 break;
159 names = getNames(QLocale::KannadaScript);
160 break;
162 names = getNames(QLocale::MalayalamScript);
163 break;
165 names = getNames(QLocale::SinhalaScript);
166 break;
168 names = getNames(QLocale::ThaiScript);
169 break;
171 names = getNames(QLocale::LaoScript);
172 break;
174 names = getNames(QLocale::TibetanScript);
175 break;
177 names = getNames(QLocale::MyanmarScript);
178 break;
180 names = getNames(QLocale::GeorgianScript);
181 break;
183 names = getNames(QLocale::HangulScript);
184 break;
186 names = getNames(QLocale::EthiopicScript);
187 break;
189 names = getNames(QLocale::CherokeeScript);
190 break;
192 names = getNames(QLocale::CanadianAboriginalScript);
193 break;
195 names = getNames(QLocale::OghamScript);
196 break;
198 names = getNames(QLocale::RunicScript);
199 break;
201 names = getNames(QLocale::KhmerScript);
202 break;
204 names = getNames(QLocale::MongolianScript);
205 break;
207 names = getNames(QLocale::HiraganaScript);
208 break;
210 names = getNames(QLocale::KatakanaScript);
211 break;
213 names = getNames(QLocale::BopomofoScript);
214 break;
216 names = getNames(QLocale::HanScript);
217 break;
218 case QChar::Script_Yi:
219 names = getNames(QLocale::YiScript);
220 break;
222 names = getNames(QLocale::OldItalicScript);
223 break;
225 names = getNames(QLocale::GothicScript);
226 break;
228 names = getNames(QLocale::DeseretScript);
229 break;
231 names = getNames(QLocale::TagalogScript);
232 break;
234 names = getNames(QLocale::HanunooScript);
235 break;
237 names = getNames(QLocale::BuhidScript);
238 break;
240 names = getNames(QLocale::TagbanwaScript);
241 break;
243 names = getNames(QLocale::CopticScript);
244 break;
246 names = getNames(QLocale::LimbuScript);
247 break;
249 names = getNames(QLocale::TaiLeScript);
250 break;
252 names = getNames(QLocale::LinearBScript);
253 break;
255 names = getNames(QLocale::UgariticScript);
256 break;
258 names = getNames(QLocale::ShavianScript);
259 break;
261 names = getNames(QLocale::OsmanyaScript);
262 break;
264 names = getNames(QLocale::CypriotScript);
265 break;
267 names = getNames(QLocale::BrailleScript);
268 break;
270 names = getNames(QLocale::BugineseScript);
271 break;
273 names = getNames(QLocale::NewTaiLueScript);
274 break;
276 names = getNames(QLocale::GlagoliticScript);
277 break;
279 names = getNames(QLocale::TifinaghScript);
280 break;
282 names = getNames(QLocale::SylotiNagriScript);
283 break;
285 names = getNames(QLocale::OldPersianScript);
286 break;
288 names = getNames(QLocale::KharoshthiScript);
289 break;
291 names = getNames(QLocale::BalineseScript);
292 break;
294 names = getNames(QLocale::CuneiformScript);
295 break;
297 names = getNames(QLocale::PhoenicianScript);
298 break;
300 names = getNames(QLocale::PhagsPaScript);
301 break;
303 names = getNames(QLocale::NkoScript);
304 break;
306 names = getNames(QLocale::SundaneseScript);
307 break;
309 names = getNames(QLocale::LepchaScript);
310 break;
312 names = getNames(QLocale::OlChikiScript);
313 break;
315 names = getNames(QLocale::VaiScript);
316 break;
318 names = getNames(QLocale::SaurashtraScript);
319 break;
321 names = getNames(QLocale::KayahLiScript);
322 break;
324 names = getNames(QLocale::RejangScript);
325 break;
327 names = getNames(QLocale::LycianScript);
328 break;
330 names = getNames(QLocale::CarianScript);
331 break;
333 names = getNames(QLocale::LydianScript);
334 break;
336 names = getNames(QLocale::ChamScript);
337 break;
339 names = getNames(QLocale::LannaScript);
340 break;
342 names = getNames(QLocale::TaiVietScript);
343 break;
345 names = getNames(QLocale::AvestanScript);
346 break;
348 names = getNames(QLocale::EgyptianHieroglyphsScript);
349 break;
351 names = getNames(QLocale::SamaritanScript);
352 break;
354 names = getNames(QLocale::FraserScript);
355 break;
357 names = getNames(QLocale::BamumScript);
358 break;
360 names = getNames(QLocale::JavaneseScript);
361 break;
363 names = getNames(QLocale::MeiteiMayekScript);
364 break;
366 names = getNames(QLocale::ImperialAramaicScript);
367 break;
369 names = getNames(QLocale::OldSouthArabianScript);
370 break;
372 names = getNames(QLocale::InscriptionalParthianScript);
373 break;
375 names = getNames(QLocale::InscriptionalPahlaviScript);
376 break;
378 names = getNames(QLocale::KaithiScript);
379 break;
381 names = getNames(QLocale::BatakScript);
382 break;
384 names = getNames(QLocale::BrahmiScript);
385 break;
387 names = getNames(QLocale::MandaeanScript);
388 break;
390 names = getNames(QLocale::ChakmaScript);
391 break;
394 names = getNames(QLocale::MeroiticCursiveScript);
395 names.append(getNames(QLocale::MeroiticScript));
396 break;
398 names = getNames(QLocale::PollardPhoneticScript);
399 break;
401 names = getNames(QLocale::SharadaScript);
402 break;
404 names = getNames(QLocale::SoraSompengScript);
405 break;
407 names = getNames(QLocale::TakriScript);
408 break;
410 names = getNames(QLocale::CaucasianAlbanianScript);
411 break;
413 names = getNames(QLocale::BassaVahScript);
414 break;
416 names = getNames(QLocale::DuployanScript);
417 break;
419 names = getNames(QLocale::ElbasanScript);
420 break;
422 names = getNames(QLocale::GranthaScript);
423 break;
425 names = getNames(QLocale::PahawhHmongScript);
426 break;
428 names = getNames(QLocale::KhojkiScript);
429 break;
431 names = getNames(QLocale::LinearAScript);
432 break;
434 names = getNames(QLocale::MahajaniScript);
435 break;
437 names = getNames(QLocale::ManichaeanScript);
438 break;
440 names = getNames(QLocale::MendeKikakuiScript);
441 break;
443 names = getNames(QLocale::ModiScript);
444 break;
446 names = getNames(QLocale::MroScript);
447 break;
449 names = getNames(QLocale::OldNorthArabianScript);
450 break;
452 names = getNames(QLocale::NabataeanScript);
453 break;
455 names = getNames(QLocale::PalmyreneScript);
456 break;
458 names = getNames(QLocale::PauCinHauScript);
459 break;
461 names = getNames(QLocale::OldPermicScript);
462 break;
464 names = getNames(QLocale::PsalterPahlaviScript);
465 break;
467 names = getNames(QLocale::SiddhamScript);
468 break;
470 names = getNames(QLocale::KhudawadiScript);
471 break;
473 names = getNames(QLocale::TirhutaScript);
474 break;
476 names = getNames(QLocale::VarangKshitiScript);
477 break;
479 names = getNames(QLocale::AhomScript);
480 break;
482 names = getNames(QLocale::AnatolianHieroglyphsScript);
483 break;
485 names = getNames(QLocale::HatranScript);
486 break;
488 names = getNames(QLocale::MultaniScript);
489 break;
491 names = getNames(QLocale::OldHungarianScript);
492 break;
498 break;
499 default:
500 qCDebug(SONNET_LOG_CORE) << "Unhandled script" << script;
501 break;
502 }
503 allLanguages.unite(QSet<QString>(names.constBegin(), names.constEnd()));
504
505 { // Remove unknown languages
506 QStringList pruned;
507 for (const QString &name : std::as_const(names)) {
508 if (!dictionaryLanguages.contains(name)) {
509 continue;
510 }
511 pruned.append(name);
512 }
513 names = pruned;
514 }
515
516 if (names.isEmpty()) {
517 continue;
518 }
519
520 for (const QString &name : std::as_const(names)) {
521 s_scriptLanguages.insert(script, name);
522 }
523 }
524
525 // Try to handle some badly named dictionaries
526 if (!allLanguages.contains(s_knownDictionaries)) {
527 QSet<QString> dicts(s_knownDictionaries);
528 dicts.subtract(allLanguages);
529 for (const QString &dictName : std::as_const(dicts)) {
530 QString languageName = QLocale(dictName).name();
531 if (languageName.isEmpty()) {
532 qCWarning(SONNET_LOG_CORE) << "Unable to parse language name" << dictName;
533 continue;
534 }
535 s_dictionaryNameMap[languageName] = dictName;
536 if (std::find(s_scriptLanguages.cbegin(), s_scriptLanguages.cend(), languageName) == s_scriptLanguages.cend()) {
537 qCWarning(SONNET_LOG_CORE) << "Unable to handle language from dictionary" << dictName << languageName;
538 }
539 }
540 }
541}
542
543GuessLanguage::GuessLanguage()
544 : d(new GuessLanguagePrivate)
545{
546}
547
549
550QString GuessLanguage::identify(const QString &text, const QStringList &suggestionsListIn) const
551{
552 if (text.isEmpty()) {
553 return QString();
554 }
555
556 // Filter for available dictionaries
557 QStringList suggestionsList;
558 for (const QString &suggestion : suggestionsListIn) {
559 if (d->s_knownDictionaries.contains(suggestion) && !suggestionsList.contains(suggestion)) {
560 suggestionsList.append(suggestion);
561 }
562 }
563
564 // Load the model on demand
565 if (d->s_knownModels.isEmpty()) {
566 d->loadModels();
567 }
568
569 const QList<QChar::Script> scriptsList = d->findRuns(text);
570
571 QStringList candidateLanguages = d->identify(text, scriptsList);
572
573 // if guessing from trigrams fail
574 if (candidateLanguages.isEmpty()) {
575 for (const QChar::Script script : scriptsList) {
576 const auto languagesList = d->s_scriptLanguages.values(script);
577 for (const QString &lang : languagesList) {
578 if (!d->s_knownModels.contains(lang)) {
579 candidateLanguages.append(lang);
580 }
581 }
582 }
583 }
584
585 // Hack for some bad dictionary names
586 for (int i = 0; i < candidateLanguages.count(); i++) {
587 if (d->s_dictionaryNameMap.contains(candidateLanguages[i])) {
588 candidateLanguages[i] = d->s_dictionaryNameMap.value(candidateLanguages[i]);
589 }
590 }
591
592 if (candidateLanguages.count() == 1) {
593 return candidateLanguages.first();
594 }
595
596 // Wasn't able to get a good guess with the trigrams, try checking all
597 // dictionaries for the suggested languages.
598 candidateLanguages.append(suggestionsList);
599 candidateLanguages.removeDuplicates();
600 QString identified = d->guessFromDictionaries(text, candidateLanguages);
601 if (!identified.isEmpty()) {
602 return identified;
603 }
604
605 qCDebug(SONNET_LOG_CORE()) << "Unable to identify string with dictionaries:" << text;
606
607 // None of our methods worked, just return the best suggestion
608 if (!suggestionsList.isEmpty()) {
609 return suggestionsList.first();
610 }
611
612 qCDebug(SONNET_LOG_CORE) << "Unable to find any suggestion for" << text;
613
614 // Not even any suggestions, give up
615 return QString();
616}
617
618void GuessLanguage::setLimits(int maxItems, double minConfidence)
619{
620 d->m_maxItems = maxItems;
621 d->m_minConfidence = minConfidence;
622}
623
624void GuessLanguagePrivate::loadModels()
625{
626 // use trigrams from resource file, easy to deploy on all platforms
627 const QString triMapFile = QStringLiteral(":/org.kde.sonnet/trigrams.map");
628 qCDebug(SONNET_LOG_CORE) << "Loading trigrams from" << triMapFile;
629
630 QFile sin(triMapFile);
631 if (!sin.open(QIODevice::ReadOnly)) {
632 qCWarning(SONNET_LOG_CORE) << "Sonnet: Unable to load trigram models from file" << triMapFile;
633 return;
634 }
635
636 QDataStream in(&sin);
637 in >> s_knownModels;
638
639 // Sanity check
640 QSet<QString> availableLanguages;
641 QHashIterator<QString, QHash<QString, int>> iterator(s_knownModels);
642 while (iterator.hasNext()) {
643 iterator.next();
644 if (iterator.value().count() < MAXGRAMS) {
645 qCWarning(SONNET_LOG_CORE) << iterator.key() << "is has only" << iterator.value().count() << "trigrams, expected" << MAXGRAMS;
646 }
647 availableLanguages.insert(iterator.key());
648 }
649 QSet<QString> knownLanguages(s_scriptLanguages.constBegin(), s_scriptLanguages.constEnd());
650 knownLanguages.subtract(availableLanguages);
651 if (!knownLanguages.isEmpty()) {
652 qCDebug(SONNET_LOG_CORE) << "Missing trigrams for languages:" << knownLanguages;
653 }
654}
655
656QList<QChar::Script> GuessLanguagePrivate::findRuns(const QString &text)
657{
658 QHash<QChar::Script, int> scriptCounts;
659
660 int totalCount = 0;
661
662 for (const QChar c : text) {
663 const QChar::Script script = c.script();
664
665 if (script == QChar::Script_Common || script == QChar::Script_Inherited) {
666 continue;
667 }
668
669 if (!c.isLetter()) {
670 continue;
671 }
672
673 scriptCounts[script]++;
674 totalCount++;
675 }
676
677 QList<QChar::Script> relevantScripts;
678
679 if (totalCount == 0) {
680 return relevantScripts;
681 }
682
683 if (scriptCounts.size() == 1) {
684 return {scriptCounts.cbegin().key()};
685 }
686
687 for (auto it = scriptCounts.cbegin(); it != scriptCounts.cend(); ++it) {
688 // return run types that used for 40% or more of the string
689 const int scriptCount = it.value();
690 const auto currentScript = it.key();
691 if (scriptCount * 100 / totalCount >= 40) {
692 relevantScripts << currentScript;
693 // always return basic latin if found more than 15%.
694 } else if (currentScript == QChar::Script_Latin && scriptCount * 100 / totalCount >= 15) {
695 relevantScripts << currentScript;
696 }
697 }
698
699 return relevantScripts;
700}
701
702QStringList GuessLanguagePrivate::identify(const QString &sample, const QList<QChar::Script> &scripts)
703{
704 if (sample.size() < MIN_LENGTH) {
705 return QStringList();
706 }
707
708 QStringList guesses;
709 for (const QChar::Script script : scripts) {
710 guesses.append(guessFromTrigrams(sample, s_scriptLanguages.values(script)));
711 }
712
713 return guesses;
714}
715
716QStringList GuessLanguagePrivate::guessFromTrigrams(const QString &sample, const QStringList &languages)
717{
718 QStringList ret;
719
720 const QList<QString> sampleTrigrams = createOrderedModel(sample);
721
722 // Sort by score
724 for (const QString &language : languages) {
725 if (s_knownModels.contains(language)) {
726 scores.insert(distance(sampleTrigrams, s_knownModels[language]), language);
727 }
728 }
729
730 // Skip if either no results or best result is completely unknown (distance >= maxdistance)
731 if (scores.isEmpty() || scores.firstKey() >= MAXGRAMS * sampleTrigrams.size()) {
732 qCDebug(SONNET_LOG_CORE) << "No scores for" << sample;
733 return ret;
734 }
735
736 int counter = 0;
737 double confidence = 0;
738
740 it.next();
741
742 QString prevItem = it.value();
743 int prevScore = it.key();
744
745 while (it.hasNext() && counter < m_maxItems && confidence < m_minConfidence) {
746 it.next();
747 counter++;
748 confidence += (it.key() - prevScore) / (double)it.key();
749 ret += prevItem;
750 prevItem = it.value();
751 prevScore = it.key();
752 }
753 if (counter < m_maxItems && confidence < m_minConfidence) {
754 ret += prevItem;
755 }
756
757 return ret;
758}
759
760QList<QString> GuessLanguagePrivate::createOrderedModel(const QString &content)
761{
762 QHash<QString, int> trigramCounts;
763
764 // collect trigrams
765 trigramCounts.reserve(content.size() - 2);
766 for (int i = 0; i < (content.size() - 2); ++i) {
767 QString tri = content.mid(i, 3).toLower();
768 trigramCounts[tri]++;
769 }
770
771 // invert the map <freq, trigram>
772 QList<QPair<int, QString>> trigramFrequencyList;
773 trigramFrequencyList.reserve(trigramCounts.size());
774
775 auto it = trigramCounts.constBegin();
776 for (; it != trigramCounts.constEnd(); ++it) {
777 const QChar *data = it.key().constData();
778 bool hasTwoSpaces = (data[1].isSpace() && (data[0].isSpace() || data[2].isSpace()));
779
780 if (!hasTwoSpaces) {
781 const int freq = it.value();
782 const QString &trigram = it.key();
783 trigramFrequencyList.append({freq, trigram});
784 }
785 }
786
787 // sort descending by frequency
788 std::sort(trigramFrequencyList.begin(), trigramFrequencyList.end(), [](const QPair<int, QString> &a, const QPair<int, QString> &b) {
789 return a.first > b.first;
790 });
791
792 QList<QString> orderedTrigrams;
793 orderedTrigrams.reserve(trigramFrequencyList.size());
794 for (const auto &tri : std::as_const(trigramFrequencyList)) {
795 orderedTrigrams.append(tri.second);
796 }
797
798 return orderedTrigrams;
799}
800
801int GuessLanguagePrivate::distance(const QList<QString> &model, const QHash<QString, int> &knownModel)
802{
803 int counter = -1;
804 int dist = 0;
805
806 for (const QString &trigram : model) {
807 const int val = knownModel.value(trigram, -1);
808 if (val != -1) {
809 dist += qAbs(++counter - val);
810 } else {
811 dist += MAXGRAMS;
812 }
813
814 if (counter == (MAXGRAMS - 1)) {
815 break;
816 }
817 }
818
819 return dist;
820}
821
822QString GuessLanguagePrivate::guessFromDictionaries(const QString &sentence, const QStringList &candidates)
823{
824 // Try to see how many languages we can get spell checking for
826 for (const QString &lang : candidates) {
827 if (!Loader::openLoader()->languages().contains(lang)) {
828 qCWarning(SONNET_LOG_CORE) << "Dictionary asked for invalid speller" << lang;
829 continue;
830 }
831 QSharedPointer<SpellerPlugin> plugin = Loader::openLoader()->cachedSpeller(lang);
832 if (!plugin.isNull()) {
833 spellers.append(plugin);
834 }
835 }
836
837 // If there's no spell checkers, give up
838 if (spellers.isEmpty()) {
839 return QString();
840 }
841
842 QMap<QString, int> correctHits;
843
844 WordTokenizer tokenizer(sentence);
845 while (tokenizer.hasNext()) {
846 Token word = tokenizer.next();
847 if (!tokenizer.isSpellcheckable()) {
848 continue;
849 }
850
851 for (int i = 0; i < spellers.count(); ++i) {
852 if (spellers[i]->isCorrect(word.toString())) {
853 correctHits[spellers[i]->language()]++;
854 }
855 }
856 }
857
858 if (correctHits.isEmpty()) {
859 return QString();
860 }
861
863 for (QMap<QString, int>::const_iterator itr = correctHits.constBegin(); itr != correctHits.constEnd(); ++itr) {
864 if (itr.value() > max.value()) {
865 max = itr;
866 }
867 }
868 return max.key();
869}
870}
QString identify(const QString &text, const QStringList &suggestions=QStringList()) const
Returns the 2 digit ISO 639-1 code for the language of the currently set text and.
~GuessLanguage()
Destructor.
void setLimits(int maxItems, double minConfidence)
Sets limits to number of languages returned by identify().
KEDUVOCDOCUMENT_EXPORT QStringList languages()
The sonnet namespace.
bool isSpace(char32_t ucs4)
const_iterator cbegin() const const
const_iterator cend() const const
const_iterator constBegin() const const
const_iterator constEnd() const const
void reserve(qsizetype size)
qsizetype size() const const
T value(const Key &key) const const
void append(QList< T > &&value)
iterator begin()
const_iterator constBegin() const const
const_iterator constEnd() const const
qsizetype count() const const
iterator end()
T & first()
bool isEmpty() const const
void reserve(qsizetype size)
qsizetype size() const const
QList< QLocale > matchingLocales(QLocale::Language language, QLocale::Script script, QLocale::Territory territory)
QString name() const const
const_iterator constBegin() const const
const_iterator constEnd() const const
bool isEmpty() const const
const_iterator constBegin() const const
const_iterator constEnd() const const
QList< T > values() const const
const Key & firstKey() const const
iterator insert(const Key &key, const T &value)
bool isEmpty() const const
bool contains(const QSet< T > &other) const const
iterator insert(const T &value)
QSet< T > & unite(const QSet< T > &other)
bool isNull() const const
QString & insert(qsizetype position, QChar ch)
bool isEmpty() const const
QString mid(qsizetype position, qsizetype n) const const
qsizetype size() const const
QString toLower() const const
bool contains(QLatin1StringView str, Qt::CaseSensitivity cs) const const
qsizetype removeDuplicates()
This file is part of the KDE documentation.
Documentation copyright © 1996-2025 The KDE developers.
Generated on Fri Jan 3 2025 11:50:10 by doxygen 1.12.0 written by Dimitri van Heesch, © 1997-2006

KDE's Doxygen guidelines are available online.