- std::vector<char> const encoded =
- ucs4_to_eightbit(s.data(), s.length(), encoding);
- return string(encoded.begin(), encoded.end());
+ FileName base(path);
+ if (!base.isDirectory()) {
+ return make_pair(string(), string());
+ }
+ FileNameList const idx_files = base.dirList("idx");
+ FileNameList const data_files = base.dirList("dat");
+ string idx;
+ string data;
+ string basename;
+
+ LYXERR(Debug::FILES, "thesaurus path: " << path);
+ for (FileNameList::const_iterator it = idx_files.begin(); it != idx_files.end(); ++it) {
+ basename = it->onlyFileNameWithoutExt();
+ if (contains(basename, to_ascii(lang))) {
+ ifstream ifs(it->absFileName().c_str());
+ if (ifs) {
+ // check for appropriate version of index file
+ string encoding; // first line is encoding
+ int items = 0; // second line is no. of items
+ getline(ifs,encoding);
+ ifs >> items;
+ if (ifs.fail()) {
+ LYXERR(Debug::FILES, "ignore irregular thesaurus idx file: " << it->absFileName());
+ continue;
+ }
+ if (encoding.length() == 0 || encoding.find_first_of(',') != string::npos) {
+ LYXERR(Debug::FILES, "ignore version1 thesaurus idx file: " << it->absFileName());
+ continue;
+ }
+ }
+ idx = it->absFileName();
+ LYXERR(Debug::FILES, "selected thesaurus idx file: " << idx);
+ break;
+ }
+ }
+ if (idx.empty())
+ return make_pair(string(), string());
+ for (support::FileNameList::const_iterator it = data_files.begin(); it != data_files.end(); ++it) {
+ if (contains(it->onlyFileName(), basename)) {
+ data = it->absFileName();
+ LYXERR(Debug::FILES, "selected thesaurus data file: " << data);
+ break;
+ }
+ }
+ return make_pair(idx, data);