Some checks failed
Docker. / Ubuntu (push) Has been cancelled
User-agent updater. / User-agent (push) Failing after 15s
Lock Threads / lock (push) Failing after 10s
Waiting for answer. / waiting-for-answer (push) Failing after 22s
Needs user action. / needs-user-action (push) Failing after 8s
Can't reproduce. / cant-reproduce (push) Failing after 8s
Close stale issues and PRs / stale (push) Has been cancelled
444 lines
12 KiB
C++
444 lines
12 KiB
C++
// This file is part of Desktop App Toolkit,
|
|
// a set of libraries for developing nice desktop applications.
|
|
//
|
|
// For license and copyright information please follow this link:
|
|
// https://github.com/desktop-app/legal/blob/master/LEGAL
|
|
//
|
|
#include "spellcheck/platform/win/spellcheck_win.h"
|
|
|
|
#include "base/platform/base_platform_info.h"
|
|
#include "spellcheck/third_party/hunspell_controller.h"
|
|
|
|
#include <wrl/client.h>
|
|
#include <spellcheck.h>
|
|
|
|
#include <QtCore/QDir>
|
|
#include <QtCore/QLocale>
|
|
#include <QVector>
|
|
|
|
using namespace Microsoft::WRL;
|
|
|
|
namespace Platform::Spellchecker {
|
|
|
|
namespace {
|
|
|
|
constexpr auto kChunk = 5000;
|
|
|
|
// Seems like ISpellChecker API has bugs for Persian language (aka Farsi).
|
|
[[nodiscard]] inline bool IsPersianLanguage(const QString &langTag) {
|
|
return langTag.startsWith(QStringLiteral("fa"));
|
|
}
|
|
|
|
[[nodiscard]] inline LPCWSTR Q2WString(QStringView string) {
|
|
return (LPCWSTR)string.utf16();
|
|
}
|
|
|
|
[[nodiscard]] inline auto SystemLanguages() {
|
|
const auto appdata = qEnvironmentVariable("appdata");
|
|
const auto dir = QDir(appdata + QString("\\Microsoft\\Spelling"));
|
|
auto list = QStringList(SystemLanguage());
|
|
list << (dir.exists()
|
|
? dir.entryList(QDir::Dirs | QDir::NoDotAndDotDot)
|
|
: QLocale::system().uiLanguages());
|
|
list.removeDuplicates();
|
|
return list | ranges::to_vector;
|
|
}
|
|
|
|
// WindowsSpellChecker class is used to store all the COM objects and
|
|
// control their lifetime. The class also provides wrappers for
|
|
// ISpellCheckerFactory and ISpellChecker APIs. All COM calls are on the
|
|
// background thread.
|
|
class WindowsSpellChecker {
|
|
public:
|
|
WindowsSpellChecker();
|
|
|
|
void addWord(LPCWSTR word);
|
|
void removeWord(LPCWSTR word);
|
|
void ignoreWord(LPCWSTR word);
|
|
[[nodiscard]] bool checkSpelling(LPCWSTR word);
|
|
void fillSuggestionList(
|
|
LPCWSTR wrongWord,
|
|
std::vector<QString> *optionalSuggestions);
|
|
void checkSpellingText(
|
|
LPCWSTR text,
|
|
MisspelledWords *misspelledWordRanges,
|
|
int offset);
|
|
[[nodiscard]] std::vector<QString> systemLanguages();
|
|
void chunkedCheckSpellingText(
|
|
QStringView textView,
|
|
MisspelledWords *misspelledWords);
|
|
|
|
private:
|
|
void createFactory();
|
|
[[nodiscard]] bool isLanguageSupported(const LPCWSTR &lang);
|
|
void createSpellCheckers();
|
|
|
|
ComPtr<ISpellCheckerFactory> _spellcheckerFactory;
|
|
std::vector<std::pair<QString, ComPtr<ISpellChecker>>> _spellcheckerMap;
|
|
|
|
};
|
|
|
|
WindowsSpellChecker::WindowsSpellChecker() {
|
|
createFactory();
|
|
createSpellCheckers();
|
|
}
|
|
|
|
void WindowsSpellChecker::createFactory() {
|
|
if (FAILED(CoCreateInstance(
|
|
__uuidof(SpellCheckerFactory),
|
|
nullptr,
|
|
(CLSCTX_INPROC_SERVER | CLSCTX_LOCAL_SERVER),
|
|
IID_PPV_ARGS(&_spellcheckerFactory)))) {
|
|
_spellcheckerFactory = nullptr;
|
|
}
|
|
}
|
|
|
|
void WindowsSpellChecker::createSpellCheckers() {
|
|
if (!_spellcheckerFactory) {
|
|
return;
|
|
}
|
|
for (const auto &lang : SystemLanguages()) {
|
|
const auto wlang = Q2WString(lang);
|
|
if (!isLanguageSupported(wlang)) {
|
|
continue;
|
|
}
|
|
if (ranges::contains(ranges::views::keys(_spellcheckerMap), lang)) {
|
|
continue;
|
|
}
|
|
auto spellchecker = ComPtr<ISpellChecker>();
|
|
auto hr = _spellcheckerFactory->CreateSpellChecker(
|
|
wlang,
|
|
&spellchecker);
|
|
if (SUCCEEDED(hr)) {
|
|
_spellcheckerMap.push_back({ lang, spellchecker });
|
|
}
|
|
}
|
|
}
|
|
|
|
bool WindowsSpellChecker::isLanguageSupported(const LPCWSTR &lang) {
|
|
if (!_spellcheckerFactory) {
|
|
return false;
|
|
}
|
|
|
|
auto isSupported = (BOOL)false;
|
|
auto hr = _spellcheckerFactory->IsSupported(lang, &isSupported);
|
|
return SUCCEEDED(hr) && isSupported;
|
|
}
|
|
|
|
void WindowsSpellChecker::fillSuggestionList(
|
|
LPCWSTR wrongWord,
|
|
std::vector<QString> *optionalSuggestions) {
|
|
auto i = 0;
|
|
for (const auto &[langTag, spellchecker] : _spellcheckerMap) {
|
|
if (IsPersianLanguage(langTag)) {
|
|
continue;
|
|
}
|
|
auto suggestions = ComPtr<IEnumString>();
|
|
auto hr = spellchecker->Suggest(wrongWord, &suggestions);
|
|
if (hr != S_OK) {
|
|
continue;
|
|
}
|
|
|
|
while (true) {
|
|
wchar_t *suggestion = nullptr;
|
|
hr = suggestions->Next(1, &suggestion, nullptr);
|
|
if (hr != S_OK) {
|
|
break;
|
|
}
|
|
const auto guess = QString::fromWCharArray(
|
|
suggestion,
|
|
wcslen(suggestion));
|
|
CoTaskMemFree(suggestion);
|
|
if (!guess.isEmpty()) {
|
|
optionalSuggestions->push_back(guess);
|
|
if (++i >= kMaxSuggestions) {
|
|
return;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
bool WindowsSpellChecker::checkSpelling(LPCWSTR word) {
|
|
for (const auto &[_, spellchecker] : _spellcheckerMap) {
|
|
auto spellingErrors = ComPtr<IEnumSpellingError>();
|
|
auto hr = spellchecker->Check(word, &spellingErrors);
|
|
|
|
if (SUCCEEDED(hr) && spellingErrors) {
|
|
auto spellingError = ComPtr<ISpellingError>();
|
|
auto startIndex = ULONG(0);
|
|
auto errorLength = ULONG(0);
|
|
auto action = CORRECTIVE_ACTION_NONE;
|
|
hr = spellingErrors->Next(&spellingError);
|
|
if (SUCCEEDED(hr) &&
|
|
spellingError &&
|
|
SUCCEEDED(spellingError->get_StartIndex(&startIndex)) &&
|
|
SUCCEEDED(spellingError->get_Length(&errorLength)) &&
|
|
SUCCEEDED(spellingError->get_CorrectiveAction(&action)) &&
|
|
(action == CORRECTIVE_ACTION_GET_SUGGESTIONS ||
|
|
action == CORRECTIVE_ACTION_REPLACE)) {
|
|
} else {
|
|
return true;
|
|
}
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
void WindowsSpellChecker::checkSpellingText(
|
|
LPCWSTR text,
|
|
MisspelledWords *misspelledWordRanges,
|
|
int offset) {
|
|
// The spellchecker marks words not from its own language as misspelled.
|
|
// So we only return words that are marked
|
|
// as misspelled in all spellcheckers.
|
|
auto misspelledWords = MisspelledWords();
|
|
|
|
constexpr auto isActionGood = [](auto action) {
|
|
return action == CORRECTIVE_ACTION_GET_SUGGESTIONS
|
|
|| action == CORRECTIVE_ACTION_REPLACE;
|
|
};
|
|
|
|
for (const auto &[langTag, spellchecker] : _spellcheckerMap) {
|
|
auto spellingErrors = ComPtr<IEnumSpellingError>();
|
|
|
|
auto hr = IsPersianLanguage(langTag)
|
|
? spellchecker->Check(text, &spellingErrors)
|
|
: spellchecker->ComprehensiveCheck(text, &spellingErrors);
|
|
if (!(SUCCEEDED(hr) && spellingErrors)) {
|
|
continue;
|
|
}
|
|
|
|
auto tempMisspelled = MisspelledWords();
|
|
auto spellingError = ComPtr<ISpellingError>();
|
|
for (; hr == S_OK; hr = spellingErrors->Next(&spellingError)) {
|
|
auto startIndex = ULONG(0);
|
|
auto errorLength = ULONG(0);
|
|
auto action = CORRECTIVE_ACTION_NONE;
|
|
|
|
if (!(SUCCEEDED(hr)
|
|
&& spellingError
|
|
&& SUCCEEDED(spellingError->get_StartIndex(&startIndex))
|
|
&& SUCCEEDED(spellingError->get_Length(&errorLength))
|
|
&& SUCCEEDED(spellingError->get_CorrectiveAction(&action))
|
|
&& isActionGood(action))) {
|
|
continue;
|
|
}
|
|
const auto word = std::pair(
|
|
(int)startIndex + offset,
|
|
(int)errorLength);
|
|
if (misspelledWords.empty()
|
|
|| ranges::contains(misspelledWords, word)) {
|
|
tempMisspelled.push_back(std::move(word));
|
|
}
|
|
}
|
|
// If the tempMisspelled vector is empty at least once,
|
|
// it means that the all words will be correct in the end
|
|
// and it makes no sense to check other languages.
|
|
if (tempMisspelled.empty()) {
|
|
return;
|
|
}
|
|
misspelledWords = std::move(tempMisspelled);
|
|
}
|
|
if (offset) {
|
|
for (auto &m : misspelledWords) {
|
|
misspelledWordRanges->push_back(std::move(m));
|
|
}
|
|
} else {
|
|
*misspelledWordRanges = misspelledWords;
|
|
}
|
|
}
|
|
|
|
void WindowsSpellChecker::addWord(LPCWSTR word) {
|
|
for (const auto &[_, spellchecker] : _spellcheckerMap) {
|
|
spellchecker->Add(word);
|
|
}
|
|
}
|
|
|
|
void WindowsSpellChecker::removeWord(LPCWSTR word) {
|
|
for (const auto &[_, spellchecker] : _spellcheckerMap) {
|
|
auto spellchecker2 = ComPtr<ISpellChecker2>();
|
|
spellchecker->QueryInterface(IID_PPV_ARGS(&spellchecker2));
|
|
if (spellchecker2) {
|
|
spellchecker2->Remove(word);
|
|
}
|
|
}
|
|
}
|
|
|
|
void WindowsSpellChecker::ignoreWord(LPCWSTR word) {
|
|
for (const auto &[_, spellchecker] : _spellcheckerMap) {
|
|
spellchecker->Ignore(word);
|
|
}
|
|
}
|
|
|
|
std::vector<QString> WindowsSpellChecker::systemLanguages() {
|
|
return ranges::views::keys(_spellcheckerMap) | ranges::to_vector;
|
|
}
|
|
|
|
void WindowsSpellChecker::chunkedCheckSpellingText(
|
|
QStringView textView,
|
|
MisspelledWords *misspelledWords) {
|
|
auto i = 0;
|
|
auto chunkBuffer = std::vector<wchar_t>();
|
|
|
|
while (i != textView.size()) {
|
|
const auto provisionalChunkSize = std::min(
|
|
kChunk,
|
|
int(textView.size() - i));
|
|
const auto chunkSize = [&] {
|
|
const auto until = std::max(
|
|
0,
|
|
provisionalChunkSize - ::Spellchecker::kMaxWordSize);
|
|
for (auto n = provisionalChunkSize; n > until; n--) {
|
|
if (textView.at(i + n - 1).isLetterOrNumber()) {
|
|
continue;
|
|
} else {
|
|
return n;
|
|
}
|
|
}
|
|
return provisionalChunkSize;
|
|
}();
|
|
const auto chunk = textView.mid(i, chunkSize);
|
|
|
|
chunkBuffer.resize(chunk.size() + 1);
|
|
const auto count = chunk.toWCharArray(chunkBuffer.data());
|
|
chunkBuffer[count] = '\0';
|
|
|
|
checkSpellingText(
|
|
(LPCWSTR)chunkBuffer.data(),
|
|
misspelledWords,
|
|
i);
|
|
i += chunk.size();
|
|
}
|
|
}
|
|
|
|
////// End of WindowsSpellChecker class.
|
|
|
|
WindowsSpellChecker &SharedSpellChecker() {
|
|
static auto spellchecker = WindowsSpellChecker();
|
|
return spellchecker;
|
|
}
|
|
|
|
} // namespace
|
|
|
|
// TODO: Add a better work with the Threading Models.
|
|
// All COM objects should be created asynchronously
|
|
// if we want to work with them asynchronously.
|
|
// Some calls can be made in the main thread before spellchecking
|
|
// (e.g. KnownLanguages), so we have to init it asynchronously first.
|
|
void Init() {
|
|
if (IsSystemSpellchecker()) {
|
|
crl::async(SharedSpellChecker);
|
|
}
|
|
}
|
|
|
|
bool IsSystemSpellchecker() {
|
|
// Windows 7 does not support spellchecking.
|
|
// https://docs.microsoft.com/en-us/windows/win32/api/spellcheck/nn-spellcheck-ispellchecker
|
|
return IsWindows8OrGreater();
|
|
}
|
|
|
|
std::vector<QString> ActiveLanguages() {
|
|
if (IsSystemSpellchecker()) {
|
|
return SharedSpellChecker().systemLanguages();
|
|
}
|
|
return ThirdParty::ActiveLanguages();
|
|
}
|
|
|
|
bool CheckSpelling(const QString &wordToCheck) {
|
|
if (!IsSystemSpellchecker()) {
|
|
return ThirdParty::CheckSpelling(wordToCheck);
|
|
}
|
|
return SharedSpellChecker().checkSpelling(Q2WString(wordToCheck));
|
|
}
|
|
|
|
void FillSuggestionList(
|
|
const QString &wrongWord,
|
|
std::vector<QString> *optionalSuggestions) {
|
|
if (IsSystemSpellchecker()) {
|
|
SharedSpellChecker().fillSuggestionList(
|
|
Q2WString(wrongWord),
|
|
optionalSuggestions);
|
|
return;
|
|
}
|
|
ThirdParty::FillSuggestionList(
|
|
wrongWord,
|
|
optionalSuggestions);
|
|
}
|
|
|
|
void AddWord(const QString &word) {
|
|
if (IsSystemSpellchecker()) {
|
|
SharedSpellChecker().addWord(Q2WString(word));
|
|
} else {
|
|
ThirdParty::AddWord(word);
|
|
}
|
|
}
|
|
|
|
void RemoveWord(const QString &word) {
|
|
if (IsSystemSpellchecker()) {
|
|
SharedSpellChecker().removeWord(Q2WString(word));
|
|
} else {
|
|
ThirdParty::RemoveWord(word);
|
|
}
|
|
}
|
|
|
|
void IgnoreWord(const QString &word) {
|
|
if (IsSystemSpellchecker()) {
|
|
SharedSpellChecker().ignoreWord(Q2WString(word));
|
|
} else {
|
|
ThirdParty::IgnoreWord(word);
|
|
}
|
|
}
|
|
|
|
bool IsWordInDictionary(const QString &wordToCheck) {
|
|
if (IsSystemSpellchecker()) {
|
|
// ISpellChecker can't check if a word is in the dictionary.
|
|
return false;
|
|
}
|
|
return ThirdParty::IsWordInDictionary(wordToCheck);
|
|
}
|
|
|
|
void UpdateLanguages(std::vector<int> languages) {
|
|
if (!IsSystemSpellchecker()) {
|
|
ThirdParty::UpdateLanguages(languages);
|
|
return;
|
|
}
|
|
crl::async([=] {
|
|
const auto result = ActiveLanguages();
|
|
crl::on_main([=] {
|
|
::Spellchecker::UpdateSupportedScripts(result);
|
|
});
|
|
});
|
|
}
|
|
|
|
void CheckSpellingText(
|
|
const QString &text,
|
|
MisspelledWords *misspelledWords) {
|
|
if (IsSystemSpellchecker()) {
|
|
// There are certain strings with a lot of 'paragraph separators'
|
|
// that crash the native Windows spellchecker. We replace them
|
|
// with spaces (no difference for the checking), they don't crash.
|
|
const auto check = QString(text).replace(QChar(8233), QChar(32));
|
|
if (check.size() > kChunk) {
|
|
// On some versions of Windows 10,
|
|
// checking large text with specific characters (e.g. @)
|
|
// will throw the std::regex_error::error_complexity exception,
|
|
// so we have to split the text.
|
|
SharedSpellChecker().chunkedCheckSpellingText(
|
|
check,
|
|
misspelledWords);
|
|
} else {
|
|
SharedSpellChecker().checkSpellingText(
|
|
(LPCWSTR)check.utf16(),
|
|
misspelledWords,
|
|
0);
|
|
}
|
|
|
|
return;
|
|
}
|
|
ThirdParty::CheckSpellingText(text, misspelledWords);
|
|
}
|
|
|
|
|
|
} // namespace Platform::Spellchecker
|