e89e7b4be2
Originally committed to SVN as r4051.
301 lines
7.7 KiB
C++
301 lines
7.7 KiB
C++
// Copyright (c) 2006, Rodrigo Braz Monteiro
|
|
// All rights reserved.
|
|
//
|
|
// Redistribution and use in source and binary forms, with or without
|
|
// modification, are permitted provided that the following conditions are met:
|
|
//
|
|
// * Redistributions of source code must retain the above copyright notice,
|
|
// this list of conditions and the following disclaimer.
|
|
// * Redistributions in binary form must reproduce the above copyright notice,
|
|
// this list of conditions and the following disclaimer in the documentation
|
|
// and/or other materials provided with the distribution.
|
|
// * Neither the name of the Aegisub Group nor the names of its contributors
|
|
// may be used to endorse or promote products derived from this software
|
|
// without specific prior written permission.
|
|
//
|
|
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
// POSSIBILITY OF SUCH DAMAGE.
|
|
//
|
|
// Aegisub Project http://www.aegisub.org/
|
|
//
|
|
// $Id$
|
|
|
|
/// @file spellchecker_hunspell.cpp
|
|
/// @brief Hunspell-based spell checker implementation
|
|
/// @ingroup spelling
|
|
///
|
|
|
|
|
|
///////////
|
|
// Headers
|
|
#include "config.h"
|
|
|
|
|
|
#ifdef WITH_HUNSPELL
|
|
|
|
#include <cstdlib>

#ifndef AGI_PRE
#include <wx/dir.h>
#include <wx/filename.h>
#include <wx/log.h>
#include <wx/txtstrm.h>
#include <wx/wfstream.h>
#endif
|
|
|
|
#include <hunspell/hunspell.hxx>
|
|
|
|
#include "charset_conv.h"
|
|
#include "options.h"
|
|
#include "spellchecker_hunspell.h"
|
|
#include "standard_paths.h"
|
|
#include "utils.h"
|
|
|
|
|
|
/// @brief Constructor
|
|
HunspellSpellChecker::HunspellSpellChecker() {
|
|
hunspell = NULL;
|
|
conv = NULL;
|
|
SetLanguage(Options.AsText(_T("Spell checker Language")));
|
|
}
|
|
|
|
|
|
|
|
/// @brief Destructor
|
|
HunspellSpellChecker::~HunspellSpellChecker() {
|
|
Reset();
|
|
}
|
|
|
|
|
|
|
|
/// @brief Reset spelling library
|
|
void HunspellSpellChecker::Reset() {
|
|
delete hunspell;
|
|
hunspell = NULL;
|
|
delete conv;
|
|
conv = NULL;
|
|
affpath.Clear();
|
|
dicpath.Clear();
|
|
}
|
|
|
|
|
|
|
|
/// @brief Can add to dictionary?
|
|
/// @param word Word to check.
|
|
/// @return Whether word can be added or not.
|
|
///
|
|
bool HunspellSpellChecker::CanAddWord(wxString word) {
|
|
if (!hunspell) return false;
|
|
wxCharBuffer buffer = word.mb_str(*conv);
|
|
return (buffer.data() != NULL);
|
|
}
|
|
|
|
|
|
|
|
/// @brief Add word to dictionary
|
|
/// @param word Word to add.
|
|
///
|
|
void HunspellSpellChecker::AddWord(wxString word) {
|
|
// Dictionary OK?
|
|
if (!hunspell) return;
|
|
|
|
// Add to currently loaded file
|
|
#ifdef WITH_OLD_HUNSPELL
|
|
hunspell->put_word(word.mb_str(*conv));
|
|
#else
|
|
hunspell->add(word.mb_str(*conv));
|
|
#endif
|
|
|
|
// Ensure that the path exists
|
|
wxFileName fn(usrdicpath);
|
|
if (!fn.DirExists()) {
|
|
wxFileName::Mkdir(fn.GetPath());
|
|
}
|
|
|
|
// Load dictionary
|
|
wxArrayString dic;
|
|
wxString curLine;
|
|
bool added = false;
|
|
if (fn.FileExists()) { // Even if you ever want to remove this "if", keep the braces, so the stream closes at the end
|
|
bool first = true;
|
|
wxFileInputStream in(usrdicpath);
|
|
if (!in.IsOk()) return;
|
|
wxTextInputStream textIn(in,_T(" \t"),*conv);
|
|
|
|
// Read it
|
|
while (in.CanRead() && !in.Eof()) {
|
|
// Read line
|
|
curLine = textIn.ReadLine();
|
|
curLine.Trim();
|
|
if (curLine.IsEmpty()) continue;
|
|
|
|
// First
|
|
if (first) {
|
|
first = false;
|
|
if (curLine.IsNumber()) continue;
|
|
}
|
|
|
|
// See if word to be added goes here
|
|
if (!added && curLine.Lower() > word.Lower()) {
|
|
dic.Add(word);
|
|
added = true;
|
|
}
|
|
|
|
// Add to memory dictionary
|
|
dic.Add(curLine);
|
|
}
|
|
}
|
|
|
|
// Not added yet
|
|
if (!added) dic.Add(word);
|
|
|
|
// Write back to disk
|
|
wxFileOutputStream out(usrdicpath);
|
|
if (!out.IsOk()) return;
|
|
wxTextOutputStream textOut(out,wxEOL_UNIX,*conv);
|
|
textOut.WriteString(wxString::Format(_T("%i"),dic.Count())+_T("\n"));
|
|
for (unsigned int i=0;i<dic.Count();i++) textOut.WriteString(dic[i]+_T("\n"));
|
|
}
|
|
|
|
|
|
|
|
/// @brief Check if the word is valid.
|
|
/// @param word Word to check
|
|
/// @return Whether word is valid or not.
|
|
///
|
|
bool HunspellSpellChecker::CheckWord(wxString word) {
|
|
if (!hunspell) return true;
|
|
wxCharBuffer buf = word.mb_str(*conv);
|
|
if (buf) return (hunspell->spell(buf) == 1);
|
|
return false;
|
|
}
|
|
|
|
|
|
|
|
/// @brief Get suggestions for word.
|
|
/// @param word Word to get suggestions for
|
|
/// @return List of suggestions
|
|
///
|
|
wxArrayString HunspellSpellChecker::GetSuggestions(wxString word) {
|
|
// Array
|
|
wxArrayString suggestions;
|
|
|
|
// Get suggestions
|
|
if (hunspell) {
|
|
// Word
|
|
wxCharBuffer buf = word.mb_str(*conv);
|
|
if (!buf) return suggestions;
|
|
|
|
// Grab raw from Hunspell
|
|
char **results;
|
|
int n = hunspell->suggest(&results,buf);
|
|
|
|
// Convert each
|
|
for (int i=0;i<n;i++) {
|
|
wxString current(results[i],*conv);
|
|
suggestions.Add(current);
|
|
delete results[i];
|
|
}
|
|
|
|
// Delete
|
|
delete results;
|
|
}
|
|
|
|
// Return them
|
|
return suggestions;
|
|
}
|
|
|
|
|
|
|
|
/// @brief Get list of available dictionaries.
|
|
/// @return List of available dictionaries
|
|
///
|
|
wxArrayString HunspellSpellChecker::GetLanguageList() {
|
|
// Get dir name
|
|
wxString path = StandardPaths::DecodePathMaybeRelative(Options.AsText(_T("Dictionaries path")), _T("?data")) + _T("/");
|
|
wxArrayString list;
|
|
wxFileName folder(path);
|
|
if (!folder.DirExists()) return list;
|
|
|
|
// Get file lists
|
|
wxArrayString dic;
|
|
wxDir::GetAllFiles(path,&dic,_T("*.dic"),wxDIR_FILES);
|
|
wxArrayString aff;
|
|
wxDir::GetAllFiles(path,&aff,_T("*.aff"),wxDIR_FILES);
|
|
|
|
// For each dictionary match, see if it can find the corresponding .aff
|
|
for (unsigned int i=0;i<dic.Count();i++) {
|
|
wxString curAff = dic[i].Left(dic[i].Length()-4) + _T(".aff");
|
|
for (unsigned int j=0;j<aff.Count();j++) {
|
|
// Found match
|
|
if (curAff == aff[j]) {
|
|
wxFileName fname(curAff);
|
|
list.Add(fname.GetName());
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
// Return list
|
|
return list;
|
|
}
|
|
|
|
|
|
|
|
/// @brief Set language.
|
|
/// @param language Language to set
|
|
///
|
|
void HunspellSpellChecker::SetLanguage(wxString language) {
|
|
// Unload
|
|
Reset();
|
|
if (language.IsEmpty()) return;
|
|
|
|
// Get dir name
|
|
//FIXME: this should use ?user instead of ?data; however, since it apparently works already on win32, I'm not gonna mess with it right now :p
|
|
wxString path = StandardPaths::DecodePathMaybeRelative(Options.AsText(_T("Dictionaries path")), _T("?data")) + _T("/");
|
|
wxString userPath = StandardPaths::DecodePath(_T("?user/dictionaries/user_"));
|
|
|
|
// Get affix and dictionary paths
|
|
affpath = wxString::Format("%s%s.aff", path, language);
|
|
dicpath = wxString::Format("%s%s.dic", path, language);
|
|
usrdicpath = wxString::Format("%s%s.dic", userPath, language);
|
|
|
|
wxLogDebug("Using dictionary: %ls", dicpath);
|
|
|
|
// Check if language is available
|
|
if (!wxFileExists(affpath) || !wxFileExists(dicpath)) return;
|
|
|
|
// Load
|
|
hunspell = new Hunspell(affpath.mb_str(csConvLocal),dicpath.mb_str(csConvLocal));
|
|
conv = NULL;
|
|
if (hunspell) {
|
|
conv = new AegisubCSConv(wxString(hunspell->get_dic_encoding(),wxConvUTF8));
|
|
|
|
// Load user dictionary
|
|
if (wxFileExists(usrdicpath)) {
|
|
wxFileInputStream in(usrdicpath);
|
|
if (!in.IsOk()) return;
|
|
wxTextInputStream textIn(in,_T(" \t"),*conv);
|
|
while (in.CanRead() && !in.Eof()) {
|
|
// Read line
|
|
wxString curLine = textIn.ReadLine();
|
|
curLine.Trim();
|
|
if (curLine.IsEmpty() || curLine.IsNumber()) continue;
|
|
#ifdef WITH_OLD_HUNSPELL
|
|
hunspell->put_word(curLine.mb_str(*conv));
|
|
#else
|
|
hunspell->add(curLine.mb_str(*conv));
|
|
#endif
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
#endif // WITH_HUNSPELL
|