X-Git-Url: https://git.lyx.org/gitweb/?a=blobdiff_plain;f=src%2FHunspellChecker.cpp;h=01ec19498b70e28075db5e5b8a9c6bb8c4c77e49;hb=4ed0312c51704780af1c452d3a82a84171b3725a;hp=2105e7b93f84fff912d3e8e0d8f8a96262eaa055;hpb=4ba2c362cbb9b8968378ecca49616402622e5825;p=lyx.git diff --git a/src/HunspellChecker.cpp b/src/HunspellChecker.cpp index 2105e7b93f..01ec19498b 100644 --- a/src/HunspellChecker.cpp +++ b/src/HunspellChecker.cpp @@ -16,17 +16,13 @@ #include "LyXRC.h" #include "WordLangTuple.h" -#include "frontends/alert.h" - #include "support/debug.h" #include "support/docstring_list.h" #include "support/filetools.h" #include "support/Package.h" #include "support/FileName.h" -#include "support/gettext.h" #include "support/lassert.h" #include "support/lstrings.h" -#include "support/os.h" #include @@ -45,9 +41,14 @@ namespace { typedef map Spellers; typedef map LangPersonalWordList; -typedef vector IgnoreList; +docstring remap_result(docstring const & s) +{ + // substitute RIGHT SINGLE QUOTATION MARK + // by APOSTROPHE + return subst(s, 0x2019, 0x0027); +} -} // anon namespace +} // namespace struct HunspellChecker::Private @@ -55,13 +56,17 @@ struct HunspellChecker::Private Private(); ~Private(); + void cleanCache(); + void setUserPath(std::string const & path); const string dictPath(int selector); bool haveLanguageFiles(string const & hpath); bool haveDictionary(Language const * lang, string & hpath); bool haveDictionary(Language const * lang); + int numDictionaries() const; Hunspell * addSpeller(Language const * lang, string & hpath); Hunspell * addSpeller(Language const * lang); Hunspell * speller(Language const * lang); + Hunspell * lookup(Language const * lang); /// ignored words bool isIgnored(WordLangTuple const & wl) const; /// personal word list interface @@ -71,36 +76,66 @@ struct HunspellChecker::Private /// the spellers Spellers spellers_; /// - IgnoreList ignored_; + WordLangTable ignored_; /// LangPersonalWordList personal_; + /// + std::string user_path_; /// the location below system/user directory /// there the aff+dic files lookup will happen const string dictDirectory(void) const { return "dicts"; } - int maxLookupSelector(void) const { return 3; } + int maxLookupSelector(void) const { return 5; } + const string HunspellDictionaryName(Language const * lang) { + return lang->variety().empty() + ? lang->code() + : lang->code() + "-" + lang->variety(); + } + const string myspellPackageDictDirectory(void) { + return "/usr/share/myspell"; + } + const string hunspellPackageDictDirectory(void) { + return "/usr/share/hunspell"; + } }; HunspellChecker::Private::Private() { + setUserPath(lyxrc.hunspelldir_path); } HunspellChecker::Private::~Private() +{ + cleanCache(); +} + + +void HunspellChecker::Private::setUserPath(std::string const & path) +{ + if (user_path_ != lyxrc.hunspelldir_path) { + cleanCache(); + user_path_ = path; + } +} + + +void HunspellChecker::Private::cleanCache() { Spellers::iterator it = spellers_.begin(); Spellers::iterator end = spellers_.end(); for (; it != end; ++it) { - if ( 0 != it->second) delete it->second; + delete it->second; + it->second = nullptr; } LangPersonalWordList::const_iterator pdit = personal_.begin(); LangPersonalWordList::const_iterator pdet = personal_.end(); for (; pdit != pdet; ++pdit) { - if ( 0 == pdit->second) + if (pdit->second == nullptr) continue; PersonalWordList * pd = pdit->second; pd->save(); @@ -120,42 +155,44 @@ bool HunspellChecker::Private::haveLanguageFiles(string const & hpath) const string HunspellChecker::Private::dictPath(int selector) { switch (selector) { + case 4: + return hunspellPackageDictDirectory(); + case 3: + return myspellPackageDictDirectory(); case 2: return addName(package().system_support().absFileName(),dictDirectory()); - break; case 1: return addName(package().user_support().absFileName(),dictDirectory()); - break; default: - return lyxrc.hunspelldir_path; + return user_path_; } } bool HunspellChecker::Private::haveDictionary(Language const * lang, string & hpath) { - if (hpath.empty()) { + if (hpath.empty() || !lang) return false; - } - LYXERR(Debug::FILES, "check hunspell path: " << hpath << " for language " << lang); - string h_path = addName(hpath, lang->code() + "-" + lang->variety()); + if (lookup(lang)) return true; + + string d_name = HunspellDictionaryName(lang); + + LYXERR(Debug::FILES, "check hunspell path: " << hpath + << " for language " << lang->lang() << " with name " << d_name); + + string h_path = addName(hpath, d_name); // first we try lang code+variety - if (!lang->variety().empty() && haveLanguageFiles(h_path)) { - hpath = h_path; - return true; - } - // next we try lang code only - h_path = addName(hpath, lang->code()); if (haveLanguageFiles(h_path)) { + LYXERR(Debug::FILES, " found " << h_path); hpath = h_path; return true; } - // last try with '_' replaced by '-' + // another try with code, '_' replaced by '-' h_path = addName(hpath, subst(lang->code(), '_', '-')); - if (!haveLanguageFiles(h_path)) { + if (!haveLanguageFiles(h_path)) return false; - } + LYXERR(Debug::FILES, " found " << h_path); hpath = h_path; return true; } @@ -164,52 +201,57 @@ bool HunspellChecker::Private::haveDictionary(Language const * lang, string & hp bool HunspellChecker::Private::haveDictionary(Language const * lang) { bool result = false; - for ( int p = 0; !result && p < maxLookupSelector(); p++ ) { + + setUserPath(lyxrc.hunspelldir_path); + for (int p = 0; !result && p < maxLookupSelector(); ++p) { string lpath = dictPath(p); result = haveDictionary(lang, lpath); } - // FIXME: if result is false... - // we should indicate somehow that this language is not - // supported, probably by popping a warning. But we'll need to - // remember which warnings we've issued. return result; } Hunspell * HunspellChecker::Private::speller(Language const * lang) { - Spellers::iterator it = spellers_.find(lang->id()); - if (it != spellers_.end()) - return it->second; + Hunspell * h = lookup(lang); + if (h) return h; + setUserPath(lyxrc.hunspelldir_path); return addSpeller(lang); } -Hunspell * HunspellChecker::Private::addSpeller(Language const * lang,string & path) +Hunspell * HunspellChecker::Private::lookup(Language const * lang) +{ + Spellers::iterator it = spellers_.find(lang->lang()); + return it != spellers_.end() ? it->second : nullptr; +} + + +Hunspell * HunspellChecker::Private::addSpeller(Language const * lang, string & path) { if (!haveDictionary(lang, path)) { - spellers_[lang->id()] = 0; - return 0; + spellers_[lang->lang()] = nullptr; + return nullptr; } FileName const affix(path + ".aff"); FileName const dict(path + ".dic"); Hunspell * h = new Hunspell(affix.absFileName().c_str(), dict.absFileName().c_str()); - LYXERR(Debug::FILES, "Hunspell speller for langage " << lang << " at " << dict << " found"); - spellers_[lang->id()] = h; + LYXERR(Debug::FILES, "Hunspell speller for langage " << lang << " at " << dict << " added."); + spellers_[lang->lang()] = h; return h; } Hunspell * HunspellChecker::Private::addSpeller(Language const * lang) { - Hunspell * h = 0; - for ( int p = 0; p < maxLookupSelector() && 0 == h; p++ ) { + Hunspell * h = nullptr; + for (int p = 0; p < maxLookupSelector() && nullptr == h; ++p) { string lpath = dictPath(p); h = addSpeller(lang, lpath); } - if (0 != h) { + if (h) { string const encoding = h->get_dic_encoding(); PersonalWordList * pd = new PersonalWordList(lang->lang()); pd->load(); @@ -225,13 +267,25 @@ Hunspell * HunspellChecker::Private::addSpeller(Language const * lang) } +int HunspellChecker::Private::numDictionaries() const +{ + int result = 0; + Spellers::const_iterator it = spellers_.begin(); + Spellers::const_iterator et = spellers_.end(); + + for (; it != et; ++it) + result += it->second != nullptr; + return result; +} + + bool HunspellChecker::Private::isIgnored(WordLangTuple const & wl) const { - IgnoreList::const_iterator it = ignored_.begin(); + WordLangTable::const_iterator it = ignored_.begin(); for (; it != ignored_.end(); ++it) { - if ((*it).lang()->code() != wl.lang()->code()) + if (it->lang()->code() != wl.lang()->code()) continue; - if ((*it).word() == wl.word()) + if (it->word() == wl.word()) return true; } return false; @@ -277,9 +331,9 @@ bool HunspellChecker::Private::learned(WordLangTuple const & wl) } -HunspellChecker::HunspellChecker(): d(new Private) -{ -} +HunspellChecker::HunspellChecker() + : d(new Private) +{} HunspellChecker::~HunspellChecker() @@ -288,29 +342,44 @@ HunspellChecker::~HunspellChecker() } -SpellChecker::Result HunspellChecker::check(WordLangTuple const & wl) +SpellChecker::Result HunspellChecker::check(WordLangTuple const & wl, + vector const & docdict) { if (d->isIgnored(wl)) return WORD_OK; + WordLangTable::const_iterator it = docdict.begin(); + for (; it != docdict.end(); ++it) { + if (it->lang()->code() != wl.lang()->code()) + continue; + if (it->word() == wl.word()) + return DOCUMENT_LEARNED_WORD; + } + Hunspell * h = d->speller(wl.lang()); if (!h) - return WORD_OK; + return NO_DICTIONARY; int info; string const encoding = h->get_dic_encoding(); string const word_to_check = to_iconv_encoding(wl.word(), encoding); + LYXERR(Debug::GUI, "spellCheck: \"" << + wl.word() << "\", lang = " << wl.lang()->lang()) ; +#ifdef HAVE_HUNSPELL_CXXABI + if (h->spell(word_to_check, &info)) +#else if (h->spell(word_to_check.c_str(), &info)) +#endif return d->learned(wl) ? LEARNED_WORD : WORD_OK; if (info & SPELL_COMPOUND) { // FIXME: What to do with that? - LYXERR(Debug::FILES, "Hunspell compound word found " << word_to_check); + LYXERR(Debug::GUI, "Hunspell compound word found " << word_to_check); } if (info & SPELL_FORBIDDEN) { // This was removed from personal dictionary - LYXERR(Debug::FILES, "Hunspell explicit forbidden word found " << word_to_check); + LYXERR(Debug::GUI, "Hunspell explicit forbidden word found " << word_to_check); } return UNKNOWN_WORD; @@ -356,13 +425,44 @@ void HunspellChecker::suggest(WordLangTuple const & wl, return; string const encoding = h->get_dic_encoding(); string const word_to_check = to_iconv_encoding(wl.word(), encoding); +#ifdef HAVE_HUNSPELL_CXXABI + vector wlst = h->suggest(word_to_check); + for (auto const & s : wlst) + suggestions.push_back(remap_result(from_iconv_encoding(s, encoding))); +#else char ** suggestion_list; int const suggestion_number = h->suggest(&suggestion_list, word_to_check.c_str()); + if (suggestion_number <= 0) + return; + for (int i = 0; i != suggestion_number; ++i) + suggestions.push_back(remap_result(from_iconv_encoding(suggestion_list[i], encoding))); + h->free_list(&suggestion_list, suggestion_number); +#endif +} + + +void HunspellChecker::stem(WordLangTuple const & wl, + docstring_list & suggestions) +{ + suggestions.clear(); + Hunspell * h = d->speller(wl.lang()); + if (!h) + return; + string const encoding = h->get_dic_encoding(); + string const word_to_check = to_iconv_encoding(wl.word(), encoding); +#ifdef HAVE_HUNSPELL_CXXABI + vector wlst = h->stem(word_to_check); + for (auto const & s : wlst) + suggestions.push_back(from_iconv_encoding(s, encoding)); +#else + char ** suggestion_list; + int const suggestion_number = h->stem(&suggestion_list, word_to_check.c_str()); if (suggestion_number <= 0) return; for (int i = 0; i != suggestion_number; ++i) suggestions.push_back(from_iconv_encoding(suggestion_list[i], encoding)); h->free_list(&suggestion_list, suggestion_number); +#endif } @@ -370,7 +470,13 @@ bool HunspellChecker::hasDictionary(Language const * lang) const { if (!lang) return false; - return (d->haveDictionary(lang)); + return d->haveDictionary(lang); +} + + +int HunspellChecker::numDictionaries() const +{ + return d->numDictionaries(); }