mirror of
https://github.com/amyinspace/MagicSetEditor2.git
synced 2026-06-12 21:47:00 -04:00
Simple spelling checker using the Hunspell library.
This time adding the source files :) The checker is used (experimentally) by the magic game file. git-svn-id: svn://svn.code.sf.net/p/magicseteditor/code/trunk@1262 0fc631ac-6414-0410-93d0-97cfa31319b6
This commit is contained in:
@@ -4,6 +4,7 @@
|
|||||||
languages := [
|
languages := [
|
||||||
English: [
|
English: [
|
||||||
code : "en",
|
code : "en",
|
||||||
|
spellcheck_code : "en_US",
|
||||||
pt_separator : "/",
|
pt_separator : "/",
|
||||||
type_separator : " — ",
|
type_separator : " — ",
|
||||||
subtype_separator : " ",
|
subtype_separator : " ",
|
||||||
@@ -17,6 +18,7 @@ languages := [
|
|||||||
|
|
||||||
Français: [
|
Français: [
|
||||||
code : "fr",
|
code : "fr",
|
||||||
|
spellcheck_code : "", # TODO: get dictionary
|
||||||
pt_separator : "/",
|
pt_separator : "/",
|
||||||
type_separator : " : "
|
type_separator : " : "
|
||||||
subtype_separator : "<atom-sep> et </atom-sep>",
|
subtype_separator : "<atom-sep> et </atom-sep>",
|
||||||
|
|||||||
@@ -322,8 +322,8 @@ mana_context :=
|
|||||||
|adds?|pay(ed)?[ ](with|using)
|
|adds?|pay(ed)?[ ](with|using)
|
||||||
)
|
)
|
||||||
([ ]either)? # pay either X or Y
|
([ ]either)? # pay either X or Y
|
||||||
([ ]<sym[^>]*>[STQXYZIWUBRG0-9/|]+</sym[^>]*>,)* # pay X, Y or Z
|
([ ](<sym[^>]*>)?[STQXYZIWUBRG0-9/|]+(</sym[^>]*>)?,)* # pay X, Y or Z
|
||||||
([ ]<sym[^>]*>[STQXYZIWUBRG0-9/|]+</sym[^>]*>[ ](and|or|and/or))* # pay X or Y
|
([ ](<sym[^>]*>)?[STQXYZIWUBRG0-9/|]+(</sym[^>]*>)?[ ](and|or|and/or))* # pay X or Y
|
||||||
[ ]<match>
|
[ ]<match>
|
||||||
([,.)]|$ # (end of word)
|
([,.)]|$ # (end of word)
|
||||||
|[ ][^ .,]*$ # still typing...
|
|[ ][^ .,]*$ # still typing...
|
||||||
@@ -343,6 +343,7 @@ text_filter :=
|
|||||||
# step 1 : remove all automatic tags
|
# step 1 : remove all automatic tags
|
||||||
remove_tag@(tag: "<sym-auto>") +
|
remove_tag@(tag: "<sym-auto>") +
|
||||||
remove_tag@(tag: "<i-auto>") +
|
remove_tag@(tag: "<i-auto>") +
|
||||||
|
remove_tag@(tag: "<error-spelling") +
|
||||||
# step 2 : reminder text for keywords
|
# step 2 : reminder text for keywords
|
||||||
expand_keywords@(
|
expand_keywords@(
|
||||||
condition: {
|
condition: {
|
||||||
@@ -392,7 +393,7 @@ text_filter :=
|
|||||||
replace: {"<nosym>" + mana_filter_t() + "</nosym>"} ) +
|
replace: {"<nosym>" + mana_filter_t() + "</nosym>"} ) +
|
||||||
# step 5 : add mana & tap symbols
|
# step 5 : add mana & tap symbols
|
||||||
replace@(
|
replace@(
|
||||||
match: "\b[STQXYZIWUBRG0-9/|]+\b",
|
match: "\\b[STQXYZIWUBRG0-9/|]+\\b",
|
||||||
in_context: mana_context,
|
in_context: mana_context,
|
||||||
replace: {"<sym-auto>" + mana_filter_t() + "</sym-auto>"} ) +
|
replace: {"<sym-auto>" + mana_filter_t() + "</sym-auto>"} ) +
|
||||||
# step 5b : add explict mana symbols
|
# step 5b : add explict mana symbols
|
||||||
@@ -410,7 +411,9 @@ text_filter :=
|
|||||||
+ "([[:lower:]])" # match this
|
+ "([[:lower:]])" # match this
|
||||||
+ "(?![)])", # not followed by this
|
+ "(?![)])", # not followed by this
|
||||||
replace: { _1 + to_upper(_2) }) +
|
replace: { _1 + to_upper(_2) }) +
|
||||||
curly_quotes
|
curly_quotes +
|
||||||
|
# step 9 : spellcheck
|
||||||
|
{ check_spelling(language:language().spellcheck_code) }
|
||||||
|
|
||||||
|
|
||||||
############################################################## Other boxes
|
############################################################## Other boxes
|
||||||
@@ -423,7 +426,9 @@ flavor_text_filter :=
|
|||||||
# step 2 : surround by <i> tags
|
# step 2 : surround by <i> tags
|
||||||
{ "<i-flavor>" + input + "</i-flavor>" } +
|
{ "<i-flavor>" + input + "</i-flavor>" } +
|
||||||
# curly quotes
|
# curly quotes
|
||||||
curly_quotes
|
curly_quotes +
|
||||||
|
# spellcheck
|
||||||
|
{ check_spelling(language:language().spellcheck_code) }
|
||||||
|
|
||||||
# Move the cursor past the separator in the p/t and type boxes
|
# Move the cursor past the separator in the p/t and type boxes
|
||||||
type_over_pt := replace@(match:"/$", replace:"")
|
type_over_pt := replace@(match:"/$", replace:"")
|
||||||
|
|||||||
@@ -0,0 +1,92 @@
|
|||||||
|
|
||||||
|
//+----------------------------------------------------------------------------+
|
||||||
|
//| Description: Magic Set Editor - Program to make Magic (tm) cards |
|
||||||
|
//| Copyright: (C) 2001 - 2008 Twan van Laarhoven and "coppro" |
|
||||||
|
//| License: GNU General Public License 2 or later (see file COPYING) |
|
||||||
|
//+----------------------------------------------------------------------------+
|
||||||
|
|
||||||
|
// ----------------------------------------------------------------------------- : Includes
|
||||||
|
|
||||||
|
#include <util/prec.hpp>
|
||||||
|
#include <script/functions/functions.hpp>
|
||||||
|
#include <script/functions/util.hpp>
|
||||||
|
#include <util/spell_checker.hpp>
|
||||||
|
#include <util/tagged_string.hpp>
|
||||||
|
|
||||||
|
// ----------------------------------------------------------------------------- : Functions
|
||||||
|
|
||||||
|
void check_word(const String& input, String& out, size_t start, size_t end, SpellChecker& checker, bool must_be_empty) {
|
||||||
|
if (start >= end) return;
|
||||||
|
String word = untag(input.substr(start,end-start));
|
||||||
|
// TODO: handle keywords and cardname references
|
||||||
|
bool error = !word.empty() && (must_be_empty || !checker.spell_with_punctuation(word));
|
||||||
|
if (error) out += _("<error-spelling>");
|
||||||
|
out.append(input, start, end-start);
|
||||||
|
if (error) out += _("</error-spelling>");
|
||||||
|
}
|
||||||
|
|
||||||
|
SCRIPT_FUNCTION(check_spelling) {
|
||||||
|
SCRIPT_PARAM(String,language);
|
||||||
|
SCRIPT_PARAM(String,input);
|
||||||
|
if (language.empty()) {
|
||||||
|
// no language -> spelling checking
|
||||||
|
SCRIPT_RETURN(true);
|
||||||
|
}
|
||||||
|
SpellChecker& checker = SpellChecker::get(language);
|
||||||
|
// remove old spelling error tags
|
||||||
|
input = remove_tag(input, _("<error-spelling"));
|
||||||
|
// now walk over the words in the input, and mark misspellings
|
||||||
|
String result;
|
||||||
|
size_t word_start = 0, pos = 0;
|
||||||
|
bool must_be_empty = false; // must this word be empty?
|
||||||
|
while (pos < input.size()) {
|
||||||
|
Char c = input.GetChar(pos);
|
||||||
|
if (c == _('<')) {
|
||||||
|
if (is_substr(input,pos,_("<sym"))) {
|
||||||
|
// before symbols should be empty
|
||||||
|
check_word(input,result, word_start,pos, checker, true);
|
||||||
|
// don't spellcheck symbols
|
||||||
|
word_start = pos;
|
||||||
|
pos = min(input.size(), match_close_tag_end(input,pos));
|
||||||
|
result.append(input, word_start, pos-word_start);
|
||||||
|
word_start = pos;
|
||||||
|
must_be_empty = true; // need a space after symbols
|
||||||
|
} else {
|
||||||
|
pos = skip_tag(input,pos);
|
||||||
|
}
|
||||||
|
} else if (isSpace(c)) {
|
||||||
|
// word boundary -> check word
|
||||||
|
check_word(input,result, word_start,pos, checker, must_be_empty);
|
||||||
|
// next
|
||||||
|
result += c;
|
||||||
|
pos++;
|
||||||
|
word_start = pos;
|
||||||
|
must_be_empty = false;
|
||||||
|
} else {
|
||||||
|
pos++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
// last word
|
||||||
|
check_word(input,result, word_start,input.size(), checker, must_be_empty);
|
||||||
|
// done
|
||||||
|
SCRIPT_RETURN(result);
|
||||||
|
}
|
||||||
|
|
||||||
|
SCRIPT_FUNCTION(check_spelling_word) {
|
||||||
|
SCRIPT_PARAM(String,language);
|
||||||
|
SCRIPT_PARAM(String,input);
|
||||||
|
if (language.empty()) {
|
||||||
|
// no language -> spelling checking
|
||||||
|
SCRIPT_RETURN(true);
|
||||||
|
} else {
|
||||||
|
bool correct = SpellChecker::get(language).spell(input);
|
||||||
|
SCRIPT_RETURN(correct);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// ----------------------------------------------------------------------------- : Init
|
||||||
|
|
||||||
|
void init_script_spelling_functions(Context& ctx) {
|
||||||
|
ctx.setVariable(_("check spelling"), script_check_spelling);
|
||||||
|
ctx.setVariable(_("check spelling word"), script_check_spelling_word);
|
||||||
|
}
|
||||||
@@ -0,0 +1,60 @@
|
|||||||
|
//+----------------------------------------------------------------------------+
|
||||||
|
//| Description: Magic Set Editor - Program to make Magic (tm) cards |
|
||||||
|
//| Copyright: (C) 2001 - 2008 Twan van Laarhoven and "coppro" |
|
||||||
|
//| License: GNU General Public License 2 or later (see file COPYING) |
|
||||||
|
//+----------------------------------------------------------------------------+
|
||||||
|
|
||||||
|
// ----------------------------------------------------------------------------- : Includes
|
||||||
|
|
||||||
|
#include <util/prec.hpp>
|
||||||
|
#include <util/spell_checker.hpp>
|
||||||
|
#include <util/io/package_manager.hpp>
|
||||||
|
|
||||||
|
// ----------------------------------------------------------------------------- : Spell checker : construction
|
||||||
|
|
||||||
|
map<String,SpellCheckerP> SpellChecker::spellers;
|
||||||
|
|
||||||
|
SpellChecker& SpellChecker::get(const String& language) {
|
||||||
|
SpellCheckerP& speller = spellers[language];
|
||||||
|
if (!speller) {
|
||||||
|
String local_dir = package_manager.getDictionaryDir(true);
|
||||||
|
String global_dir = package_manager.getDictionaryDir(false);
|
||||||
|
String aff_path = language + _(".aff");
|
||||||
|
String dic_path = language + _(".dic");
|
||||||
|
if (wxFileExists(local_dir + aff_path) && wxFileExists(local_dir + dic_path)) {
|
||||||
|
speller = SpellCheckerP(new SpellChecker((local_dir + aff_path).mb_str(),
|
||||||
|
(local_dir + dic_path).mb_str()));
|
||||||
|
} else if (wxFileExists(global_dir + aff_path) && wxFileExists(global_dir + dic_path)) {
|
||||||
|
speller = SpellCheckerP(new SpellChecker((global_dir + aff_path).mb_str(),
|
||||||
|
(global_dir + dic_path).mb_str()));
|
||||||
|
} else {
|
||||||
|
throw Error(_("Dictionary not found for language: ") + language);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return *speller;
|
||||||
|
}
|
||||||
|
|
||||||
|
SpellChecker::SpellChecker(const char* aff_path, const char* dic_path)
|
||||||
|
: Hunspell(aff_path,dic_path)
|
||||||
|
, encoding(String(get_dic_encoding(), IF_UNICODE(wxConvLibc, wxSTRING_MAXLEN)))
|
||||||
|
{}
|
||||||
|
|
||||||
|
void SpellChecker::destroy() {
|
||||||
|
spellers.clear();
|
||||||
|
}
|
||||||
|
|
||||||
|
// ----------------------------------------------------------------------------- : Spell checker : use
|
||||||
|
|
||||||
|
bool SpellChecker::spell(const String& word) {
|
||||||
|
return Hunspell::spell(word.mb_str(encoding));
|
||||||
|
}
|
||||||
|
|
||||||
|
const String word_start = String(_("[({\"\'")) + LEFT_SINGLE_QUOTE + LEFT_DOUBLE_QUOTE;
|
||||||
|
const String word_end = String(_("])}.,;:\"\'")) + RIGHT_SINGLE_QUOTE + RIGHT_DOUBLE_QUOTE;
|
||||||
|
|
||||||
|
bool SpellChecker::spell_with_punctuation(const String& word) {
|
||||||
|
size_t first = word.find_first_not_of(word_start);
|
||||||
|
size_t last = word.find_last_not_of(word_end);
|
||||||
|
if (first > last) return false; // just punctuation is incorrect
|
||||||
|
return spell(word.substr(first, last-first+1));
|
||||||
|
}
|
||||||
@@ -0,0 +1,42 @@
|
|||||||
|
//+----------------------------------------------------------------------------+
|
||||||
|
//| Description: Magic Set Editor - Program to make Magic (tm) cards |
|
||||||
|
//| Copyright: (C) 2001 - 2008 Twan van Laarhoven and "coppro" |
|
||||||
|
//| License: GNU General Public License 2 or later (see file COPYING) |
|
||||||
|
//+----------------------------------------------------------------------------+
|
||||||
|
|
||||||
|
#ifndef HEADER_UTIL_SPELL_CHECKER
|
||||||
|
#define HEADER_UTIL_SPELL_CHECKER
|
||||||
|
|
||||||
|
// ----------------------------------------------------------------------------- : Includes
|
||||||
|
|
||||||
|
#include <util/prec.hpp>
|
||||||
|
#include "hunspell.hxx"
|
||||||
|
|
||||||
|
DECLARE_POINTER_TYPE(SpellChecker);
|
||||||
|
|
||||||
|
// ----------------------------------------------------------------------------- : Spell checker
|
||||||
|
|
||||||
|
/// A spelling checker for a particular language
|
||||||
|
class SpellChecker : public Hunspell, public IntrusivePtrBase<SpellChecker> {
|
||||||
|
public:
|
||||||
|
/// Get a SpellChecker object for the given language.
|
||||||
|
/** Note: This is not threadsafe yet */
|
||||||
|
static SpellChecker& get(const String& language);
|
||||||
|
/// Destroy all cached SpellChecker objects
|
||||||
|
static void destroy();
|
||||||
|
|
||||||
|
/// Check the spelling of a single word
|
||||||
|
bool spell(const String& word);
|
||||||
|
/// Check the spelling of a single word, ignore punctuation
|
||||||
|
bool spell_with_punctuation(const String& word);
|
||||||
|
|
||||||
|
private:
|
||||||
|
/// Convert between String and dictionary encoding
|
||||||
|
wxCSConv encoding;
|
||||||
|
|
||||||
|
SpellChecker(const char* aff_path, const char* dic_path);
|
||||||
|
static map<String,SpellCheckerP> spellers; //< Cached checkers for each language
|
||||||
|
};
|
||||||
|
|
||||||
|
// ----------------------------------------------------------------------------- : EOF
|
||||||
|
#endif
|
||||||
Reference in New Issue
Block a user