forked from mia/Aegisub
792225317e
1. svn mv OverLua SSATool athenasub avisynth_prs kanamemo \ motiontracker prs traydict unit_test vsfilter devel/ * See r2749 for full description. Originally committed to SVN as r2755.
440 lines
12 KiB
C++
440 lines
12 KiB
C++
// Copyright (c) 2006, Rodrigo Braz Monteiro
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
//   * Redistributions of source code must retain the above copyright notice,
//     this list of conditions and the following disclaimer.
//   * Redistributions in binary form must reproduce the above copyright notice,
//     this list of conditions and the following disclaimer in the documentation
//     and/or other materials provided with the distribution.
//   * Neither the name of the TrayDict Group nor the names of its contributors
//     may be used to endorse or promote products derived from this software
//     without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
// POSSIBILITY OF SUCH DAMAGE.
//
// -----------------------------------------------------------------------------
//
// TRAYDICT
//
// Website: http://aegisub.cellosoft.com
// Contact: mailto:zeratul@cellosoft.com
//
|
|
|
|
|
///////////
|
|
// Headers
|
|
#include "kana_table.h"
|
|
|
|
|
|
///////////////
|
|
// Constructor
|
|
KanaTable::KanaTable() {
|
|
level = 0;
|
|
groups[0] = 0;
|
|
groups[1] = 0;
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3042",L"\u30a2",L"a");
|
|
Insert(L"\u3044",L"\u30a4",L"i");
|
|
Insert(L"\u3046",L"\u30a6",L"u");
|
|
Insert(L"\u3048",L"\u30a8",L"e");
|
|
Insert(L"\u304a",L"\u30aa",L"o");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u304b",L"\u30ab",L"ka");
|
|
Insert(L"\u304d",L"\u30ad",L"ki");
|
|
Insert(L"\u304f",L"\u30af",L"ku");
|
|
Insert(L"\u3051",L"\u30b1",L"ke");
|
|
Insert(L"\u3053",L"\u30b3",L"ko");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3055",L"\u30b5",L"sa");
|
|
Insert(L"\u3057",L"\u30b7",L"shi");
|
|
Insert(L"\u3059",L"\u30b9",L"su");
|
|
Insert(L"\u305b",L"\u30bb",L"se");
|
|
Insert(L"\u305d",L"\u30bd",L"so");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u305f",L"\u30bf",L"ta");
|
|
Insert(L"\u3061",L"\u30c1",L"chi");
|
|
Insert(L"\u3064",L"\u30c4",L"tsu");
|
|
Insert(L"\u3066",L"\u30c6",L"te");
|
|
Insert(L"\u3068",L"\u30c8",L"to");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u306a",L"\u30ca",L"na");
|
|
Insert(L"\u306b",L"\u30cb",L"ni");
|
|
Insert(L"\u306c",L"\u30cc",L"nu");
|
|
Insert(L"\u306d",L"\u30cd",L"ne");
|
|
Insert(L"\u306e",L"\u30ce",L"no");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u306f",L"\u30cf",L"ha");
|
|
Insert(L"\u3072",L"\u30d2",L"hi");
|
|
Insert(L"\u3075",L"\u30d5",L"fu");
|
|
Insert(L"\u3078",L"\u30d8",L"he");
|
|
Insert(L"\u307b",L"\u30db",L"ho");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u307e",L"\u30de",L"ma");
|
|
Insert(L"\u307f",L"\u30df",L"mi");
|
|
Insert(L"\u3080",L"\u30e0",L"mu");
|
|
Insert(L"\u3081",L"\u30e1",L"me");
|
|
Insert(L"\u3082",L"\u30e2",L"mo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3084",L"\u30e4",L"ya");
|
|
Insert(L"\u3086",L"\u30e6",L"yu");
|
|
Insert(L"\u3088",L"\u30e8",L"yo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3089",L"\u30e9",L"ra");
|
|
Insert(L"\u308a",L"\u30ea",L"ri");
|
|
Insert(L"\u308b",L"\u30eb",L"ru");
|
|
Insert(L"\u308c",L"\u30ec",L"re");
|
|
Insert(L"\u308d",L"\u30ed",L"ro");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u308f",L"\u30ef",L"wa");
|
|
Insert(L"\u3090",L"\u30f0",L"wi");
|
|
Insert(L"\u3091",L"\u30f1",L"we");
|
|
Insert(L"\u3092",L"\u30f2",L"wo");
|
|
|
|
BeginGroup();
|
|
level--;
|
|
Insert(L"\u3093",L"\u30f3",L"n");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u304c",L"\u30ac",L"ga");
|
|
Insert(L"\u304e",L"\u30ae",L"gi");
|
|
Insert(L"\u3050",L"\u30b0",L"gu");
|
|
Insert(L"\u3052",L"\u30b2",L"ge");
|
|
Insert(L"\u3054",L"\u30b4",L"go");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3056",L"\u30b6",L"za");
|
|
Insert(L"\u3058",L"\u30b8",L"ji");
|
|
Insert(L"\u305a",L"\u30ba",L"zu");
|
|
Insert(L"\u305c",L"\u30bc",L"ze");
|
|
Insert(L"\u305e",L"\u30be",L"zo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3060",L"\u30c0",L"da");
|
|
Insert(L"\u3062",L"\u30c2",L"ji");
|
|
Insert(L"\u3065",L"\u30c5",L"zu");
|
|
Insert(L"\u3067",L"\u30c7",L"de");
|
|
Insert(L"\u3069",L"\u30c9",L"do");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3070",L"\u30d0",L"ba");
|
|
Insert(L"\u3073",L"\u30d3",L"bi");
|
|
Insert(L"\u3076",L"\u30d6",L"bu");
|
|
Insert(L"\u3079",L"\u30d9",L"be");
|
|
Insert(L"\u307c",L"\u30dc",L"bo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3071",L"\u30d1",L"pa");
|
|
Insert(L"\u3074",L"\u30d4",L"pi");
|
|
Insert(L"\u3077",L"\u30d7",L"pu");
|
|
Insert(L"\u307a",L"\u30da",L"pe");
|
|
Insert(L"\u307d",L"\u30dd",L"po");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u304d\u3083",L"\u30ad\u30e3",L"kya");
|
|
Insert(L"\u304d\u3085",L"\u30ad\u30e5",L"kyu");
|
|
Insert(L"\u304d\u3087",L"\u30ad\u30e7",L"kyo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3057\u3083",L"\u30b7\u30e3",L"sha");
|
|
Insert(L"\u3057\u3085",L"\u30b7\u30e5",L"shu");
|
|
Insert(L"\u3057\u3087",L"\u30b7\u30e7",L"sho");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3061\u3083",L"\u30c1\u30e3",L"cha");
|
|
Insert(L"\u3061\u3085",L"\u30c1\u30e5",L"chu");
|
|
Insert(L"\u3061\u3087",L"\u30c1\u30e7",L"cho");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u306b\u3083",L"\u30cb\u30e3",L"nya");
|
|
Insert(L"\u306b\u3085",L"\u30cb\u30e5",L"nyu");
|
|
Insert(L"\u306b\u3087",L"\u30cb\u30e7",L"nyo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3072\u3083",L"\u30d2\u30e3",L"hya");
|
|
Insert(L"\u3072\u3085",L"\u30d2\u30e5",L"hyu");
|
|
Insert(L"\u3072\u3087",L"\u30d2\u30e7",L"hyo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u307f\u3083",L"\u30df\u30e3",L"mya");
|
|
Insert(L"\u307f\u3085",L"\u30df\u30e5",L"myu");
|
|
Insert(L"\u307f\u3087",L"\u30df\u30e7",L"myo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u308a\u3083",L"\u30ea\u30e3",L"rya");
|
|
Insert(L"\u308a\u3085",L"\u30ea\u30e5",L"ryu");
|
|
Insert(L"\u308a\u3087",L"\u30ea\u30e7",L"ryo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u304e\u3083",L"\u30ae\u30e3",L"gya");
|
|
Insert(L"\u304e\u3085",L"\u30ae\u30e5",L"gyu");
|
|
Insert(L"\u304e\u3087",L"\u30ae\u30e7",L"gyo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3058\u3083",L"\u30b8\u30e3",L"ja");
|
|
Insert(L"\u3058\u3085",L"\u30b8\u30e5",L"ju");
|
|
Insert(L"\u3058\u3087",L"\u30b8\u30e7",L"jo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3062\u3083",L"\u30c2\u30e3",L"ja");
|
|
Insert(L"\u3062\u3085",L"\u30c2\u30e5",L"ju");
|
|
Insert(L"\u3062\u3087",L"\u30c2\u30e7",L"jo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3073\u3083",L"\u30d3\u30e3",L"bya");
|
|
Insert(L"\u3073\u3085",L"\u30d3\u30e5",L"byu");
|
|
Insert(L"\u3073\u3087",L"\u30d3\u30e7",L"byo");
|
|
|
|
BeginGroup();
|
|
Insert(L"\u3074\u3083",L"\u30d4\u30e3",L"pya");
|
|
Insert(L"\u3074\u3085",L"\u30d4\u30e5",L"pyu");
|
|
Insert(L"\u3074\u3087",L"\u30d4\u30e7",L"pyo");
|
|
|
|
BeginGroup();
|
|
Insert(L"",L"\u30d5\u30a1",L"fa");
|
|
Insert(L"",L"\u30d5\u30a3",L"fi");
|
|
Insert(L"",L"\u30d5\u30a7",L"fe");
|
|
Insert(L"",L"\u30d5\u30a9",L"fo");
|
|
|
|
BeginGroup();
|
|
Insert(L"",L"\u30f4\u30a1",L"va");
|
|
Insert(L"",L"\u30f4\u30a3",L"vi");
|
|
Insert(L"",L"\u30f4",L"vu");
|
|
Insert(L"",L"\u30f4\u30a7",L"ve");
|
|
Insert(L"",L"\u30f4\u30a9",L"vo");
|
|
Insert(L"",L"\u30d5\u30e5",L"fyu");
|
|
|
|
BeginGroup();
|
|
Insert(L"",L"\u30a4\u30a7",L"ye");
|
|
Insert(L"",L"\u30a6\u30a3",L"wi");
|
|
Insert(L"",L"\u30a6\u30a7",L"we");
|
|
Insert(L"",L"\u30a6\u30a9",L"wo");
|
|
|
|
BeginGroup();
|
|
Insert(L"",L"\u30f4\u30e3",L"vya");
|
|
Insert(L"",L"\u30f4\u30e5",L"vyu");
|
|
Insert(L"",L"\u30f4\u30e7",L"vyo");
|
|
|
|
BeginGroup();
|
|
Insert(L"",L"\u30b7\u30a7",L"she");
|
|
Insert(L"",L"\u30b8\u30a7",L"je");
|
|
Insert(L"",L"\u30c1\u30a7",L"che");
|
|
|
|
BeginGroup();
|
|
Insert(L"",L"\u30c6\u30a3",L"ti");
|
|
Insert(L"",L"\u30c6\u30a5",L"tu");
|
|
Insert(L"",L"\u30c6\u30e5",L"tyu");
|
|
|
|
BeginGroup();
|
|
Insert(L"",L"\u30c7\u30a3",L"di");
|
|
Insert(L"",L"\u30c7\u30a5",L"du");
|
|
Insert(L"",L"\u30c7\u30a5",L"dyu");
|
|
|
|
BeginGroup();
|
|
Insert(L"",L"\u30c4\u30a1",L"tsa");
|
|
Insert(L"",L"\u30c4\u30a3",L"tsi");
|
|
Insert(L"",L"\u30c4\u30a7",L"tse");
|
|
Insert(L"",L"\u30c4\u30a9",L"tso");
|
|
}
|
|
|
|
|
|
//////////////
|
|
// Destructor
|
|
KanaTable::~KanaTable() {
|
|
}
|
|
|
|
|
|
///////////////
|
|
// Begin group
|
|
void KanaTable::BeginGroup() {
|
|
curGroup = _T("");
|
|
level++;
|
|
}
|
|
|
|
|
|
//////////
|
|
// Insert
|
|
void KanaTable::Insert(wchar_t *hira,wchar_t *kata,wchar_t *hep) {
|
|
#ifdef _UNICODE
|
|
KanaEntry entry(hira,kata,hep);
|
|
if (curGroup.IsEmpty()) curGroup = hep;
|
|
entry.group = curGroup;
|
|
entry.level = level;
|
|
if (!entry.hiragana.IsEmpty() && level > groups[0]) groups[0] = level;
|
|
if (!entry.katakana.IsEmpty() && level > groups[1]) groups[1] = level;
|
|
entries.push_back(entry);
|
|
#endif
|
|
}
|
|
|
|
|
|
/////////////////////
|
|
// Number of entries
|
|
int KanaTable::GetNumberEntries(int level) const {
|
|
if (level == -1) return entries.size();
|
|
else {
|
|
int count = 0;
|
|
int n = entries.size();
|
|
for (int i=0;i<n;i++) {
|
|
if (entries[i].level <= level) count++;
|
|
}
|
|
return count;
|
|
}
|
|
}
|
|
|
|
|
|
////////////////////////
|
|
// Get a specific entry
|
|
const KanaEntry &KanaTable::GetEntry(int i) const {
|
|
return entries.at(i);
|
|
}
|
|
|
|
|
|
//////////////////////////
|
|
// Find a specific romaji
|
|
const KanaEntry *KanaTable::FindByRomaji(wxString romaji) const {
|
|
int n = entries.size();
|
|
for (int i=0;i<n;i++) {
|
|
if (entries[i].hepburn == romaji) return &entries[i];
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
|
|
////////////////////////
|
|
// Find a specific kana
|
|
const KanaEntry *KanaTable::FindByKana(wxString kana) const {
|
|
int n = entries.size();
|
|
for (int i=0;i<n;i++) {
|
|
if (entries[i].hiragana == kana) return &entries[i];
|
|
if (entries[i].katakana == kana) return &entries[i];
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
|
|
/////////////////////////////////////////////
|
|
// Get number of levels for a specific table
|
|
int KanaTable::GetLevels(int table) const {
|
|
return groups[table];
|
|
}
|
|
|
|
|
|
//////////////////////////
|
|
// Convert kana to romaji
|
|
wxString KanaTable::KanaToRomaji(wxString kana,int type) {
|
|
// Prepare
|
|
wxString lastSyl;
|
|
wxString final;
|
|
bool ltsu = false;
|
|
bool longVowel = false;
|
|
|
|
// Look up the entries
|
|
for (size_t i=0;i<kana.Length();i++) {
|
|
// Find syllable
|
|
const KanaEntry *cur;
|
|
cur = FindByKana(kana.Mid(i,2));
|
|
if (cur) i++;
|
|
else cur = FindByKana(kana.Mid(i,1));
|
|
|
|
// Check if it's little tsu or long vowel in katakana
|
|
if (!cur) {
|
|
if (kana.Mid(i,1) == _T("\u3063") || kana.Mid(i,1) == _T("\uff6f") || kana.Mid(i,1) == _T("\u30c3")) {
|
|
ltsu = true;
|
|
continue;
|
|
}
|
|
|
|
if (kana.Mid(i,1) == _T("\u30fc") || kana.Mid(i,1) == _T("-")) {
|
|
longVowel = true;
|
|
}
|
|
}
|
|
|
|
// Append
|
|
if (cur || longVowel) {
|
|
bool vetoAdd = false;
|
|
|
|
// Hepburn
|
|
if (type == 1) {
|
|
if (longVowel) {
|
|
longVowel = false;
|
|
final += 0x304;
|
|
vetoAdd = true;
|
|
}
|
|
|
|
else {
|
|
// Check for need to add apostrophe
|
|
wxString fl;
|
|
if (lastSyl == _T("n")) {
|
|
fl = cur->hepburn.Left(1);
|
|
bool add = false;
|
|
if (fl == _T("y") || fl == _T("a") || fl == _T("e") || fl == _T("i") || fl == _T("o") || fl == _T("u")) add = true;
|
|
if (fl == _T("n") && cur->hiragana == _T("\u3063")) add = true;
|
|
if (add) final += _T("'");
|
|
}
|
|
|
|
// Check if it needs to add a macron
|
|
wxString last = lastSyl.Right(1);
|
|
wxString curV = cur->hepburn;
|
|
if ((last == _T("o") && curV == _T("u")) || (last == curV && last != _T("n") /*&& last != lastSyl */)) {
|
|
wchar_t macron;
|
|
switch(last[0]) {
|
|
case L'a': macron = 257; break;
|
|
case L'e': macron = 275; break;
|
|
case L'i': macron = 299; break;
|
|
case L'o': macron = 333; break;
|
|
case L'u': macron = 363; break;
|
|
}
|
|
final = final.Left(final.Length()-1) + macron;
|
|
vetoAdd = true;
|
|
}
|
|
}
|
|
}
|
|
|
|
// Wopura
|
|
else {
|
|
if (longVowel) {
|
|
longVowel = false;
|
|
final += lastSyl.Right(1);
|
|
vetoAdd = true;
|
|
}
|
|
}
|
|
|
|
// Add syllable
|
|
if (!vetoAdd) {
|
|
// Little tsu
|
|
if (ltsu) {
|
|
ltsu = false;
|
|
final += cur->hepburn.Left(1);
|
|
}
|
|
|
|
// Standard
|
|
final += cur->hepburn;
|
|
}
|
|
|
|
// Set last
|
|
if (cur) lastSyl = cur->hepburn;
|
|
}
|
|
}
|
|
return final;
|
|
}
|