Naraguna:Bennylin/trans-batak.js: Béda antara owahan
Konten dihapus Konten ditambahkan
Tanpa ringkesan besutan |
Tanpa ringkesan besutan |
||
Larik 60: | Larik 60: | ||
function getLanguage() { |
function getLanguage() { |
||
var |
var bahasa; |
||
var modeTranslit = document.getElementsByName("bahasa"); |
var modeTranslit = document.getElementsByName("bahasa"); |
||
for(var rad in modeTranslit) { |
for(var rad in modeTranslit) { |
||
Larik 100: | Larik 100: | ||
"A":'ᯀ', "E":'ᯀᯩ', "I":'ᯤ', "O":'ᯀᯭ', "U":'ᯥ', "X":'ᯀᯧ' |
"A":'ᯀ', "E":'ᯀᯩ', "I":'ᯤ', "O":'ᯀᯭ', "U":'ᯥ', "X":'ᯀᯧ' |
||
} |
} |
||
var matramap; |
|||
var bahasa = getLanguage(); |
var bahasa = getLanguage(); |
||
if (bahasa == "karo") |
if (bahasa == "karo") |
||
Larik 198: | Larik 199: | ||
"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ" |
"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ" |
||
} |
} |
||
var soundMap; |
|||
var bahasa = getLanguage(); |
var bahasa = getLanguage(); |
||
if (bahasa == "karo") |
if (bahasa == "karo") |
||
soundMap = soundMapK; |
|||
else if (bahasa == "simalungun") |
else if (bahasa == "simalungun") |
||
soundMap = soundMapS; |
|||
else if (bahasa == "toba") |
else if (bahasa == "toba") |
||
soundMap = soundMapT; |
|||
else if (bahasa == "pakpak-dairi") |
else if (bahasa == "pakpak-dairi") |
||
soundMap = soundMapPD; |
|||
else if (bahasa == "angkola-mandailing") |
else if (bahasa == "angkola-mandailing") |
||
soundMap = soundMapAM; |
|||
var h_shift = GetShift(str); |
var h_shift = GetShift(str); |
Révisi kala 2 April 2021 14.49
/*!
* trans.js
* https://bennylin.github.com/transliterasi/batak.html
*
* Copyright 2013-2021, Bennylin @bennylin
* Dual licensed under the MIT or GPL Version 2 licenses.
* Released under the MIT, BSD, and GPL Licenses.
*
* Versions:
* 1 April 2021 - v 1.0
* TODO: tompi, bindu, u_1bef, -ou simalungun
*
* Derived from my Javanese transliteration: https://jv.wikipedia.org/wiki/Naraguna:Bennylin/trans.js
*/
var vowelPrev = false;
/***************************
Function SuperTrim, findstr
trim string, menemukan karakter di dalam string
****************************/
function SuperTrim(str) {
str = str || '';
return str.replace(/^\s*|\s*$/g,'').replace(/\s+/g,' ');
}
function findstr(str,tofind) {
for (var i = 0; i < str.length; i++)
if (str[i] == tofind)
return true;
return false;
}
/***************************
Function isDigit, isPunct, isVowel
cek apakah digit, tanda baca, atau huruf vokal (a, e/è/é, i, o, u, ě/ê, ô, ā/ī/ū/ō)
****************************/
function isDigit(a) {
var str = "0123456789";
return findstr(str,a);
}
function isPunct(a) {
var str = ",.><?/+=-_}{[]*&^%$#@!~`\"\\|:;()";
return findstr(str,a);
}
function isVowel(a) {
var str = "AaEeÈèÉéIiOoUuÊêĚěXxôāīūō";
return findstr(str,a);
}
function isConsonant(a) {
var str = "BCDfGHJKLMNPQRSTVWXYZbcdfghjklmnpqrstvwxyz";
//QXqx are special chars, add engma & enye
return findstr(str,a);
}
/***************************
Function isSpecial, isHR, isLW
cek apakah karakter spesial (bikonsonan)
****************************/
function isSpecial(a) {
var str = "GgYyDdBb";
//untuk bikonsonan nga, nya, nda, mba
return findstr(str,a);
}
function getLanguage() {
var bahasa;
var modeTranslit = document.getElementsByName("bahasa");
for(var rad in modeTranslit) {
if(modeTranslit[rad].checked)
bahasa = modeTranslit[rad].value;
}
return bahasa;
}
/***************************
Function GetMatra
apabila huruf vokal, return matra (sandhangan swara)
****************************/
function GetMatra(str) {
var i = 0;
if (str.length < 1) {
return "";
}
while (str[i] == 'h') {
i++;
if (i >= str.length) {
break;
}
}
if (i < str.length) {
str = str.substring(i);
}
//Aksara i (ᯤ) dan u (ᯥ) hanya digunakan untuk suku kata terbuka, misal pada kata dan ina ᯤᯉ dan ulu ᯥᯞᯮ. Untuk suku kata tertutup yang diawali dengan bunyi i atau u, digunakanlah aksara a (ᯀ atau ᯁ) bersama diaktirik untuk masing-masing vokal, misal pada kata indung ᯀᯪᯉ᯲ᯑᯮᯰ dan umpama ᯀᯮᯔ᯲ᯇᯔ
//Huruf Latin kapital I dan U menghasilkan aksara-aksara "ina ni surat" ᯤ dan ᯥ, sementara huruf Latin kecil i dan u menghasilkan aksara-aksara "anak ni surat" ᯀᯪ dan ᯀᯮ.
var matramapT= { //toba, pakpak, mandailing
"e":'ᯩ', "é":'ᯩ', "i":'ᯪ', "o":'ᯬ', "u":'ᯮ', "x":'ᯧ',
"A":'ᯀ', "E":'ᯀᯩ', "I":'ᯤ', "O":'ᯀᯬ', "U":'ᯥ', "X":'ᯀᯧ'
}
var matramapS= { //simalungun
"e":'ᯩ', "é":'ᯩ', "i":'ᯫ', "o":'ᯬ', "u":'ᯮ', "x":'ᯧ',
"A":'ᯁ', "E":'ᯁᯩ', "I":'ᯤ', "O":'ᯁᯬ', "U":'ᯥ', "X":'ᯁᯧ'
}
var matramapK= { //karo
"e":'ᯩ', "é":'ᯩ', "i":'ᯫ', "o":'ᯭ', "u":'ᯬ', "x":'ᯧ',
"A":'ᯀ', "E":'ᯀᯩ', "I":'ᯤ', "O":'ᯀᯭ', "U":'ᯥ', "X":'ᯀᯧ'
}
var matramap;
var bahasa = getLanguage();
if (bahasa == "karo")
matramap = matramapK;
else if (bahasa == "simalungun")
matramap = matramapS;
else //if (bahasa == "toba" || bahasa == "pakpak-dairi" || bahasa == "angkola-mandailing")
matramap = matramapT;
if(matramap[str]!==undefined) {
return matramap[str];
}
return "";
}
/***************************
Function GetShift
apabila huruf bikonsonan, return karakter khusus
****************************/
function GetShift(str) {
str = str.toLowerCase();
if (str.indexOf("ng") == 0) {
//suku kata diawali 'ng'
if (str.indexOf("nga") == 0) {
return { "CoreSound": "" + "ᯝ", "len": 3 };
} else if (str.indexOf("nge") == 0) {
return { "CoreSound": "" + "ᯝᯩ", "len": 3 };
} else if (str.indexOf("ngi") == 0) {
return { "CoreSound": "" + "ᯝᯫ", "len": 3 };
} else if (str.indexOf("ngo") == 0) {
return { "CoreSound": "" + "ᯝᯬ", "len": 3 };
} else if (str.indexOf("ngu") == 0) {
return { "CoreSound": "" + "ᯝᯮ", "len": 3 };
} else {
return { "CoreSound": "ᯰ", "len": 2 }; //amisara (sandhangan / cecak)
}
}
//nya
if (str.indexOf("ny") == 0) {
//suku kata diawali 'ny'
return { "CoreSound": "ᯠ", "len": 2 };
} /*
if (str.indexOf("nd") == 0) {
//nd-
return { "CoreSound": "ᯢ", "len": 2 };
} *//*
if (str.indexOf("mb") == 0) {
//mb-
return { "CoreSound": "ᯣ", "len": 2 };
} */
return {
"CoreSound": null, "len": 1
}
;
}
/***************************
Function GetCoreSound
return aksara nglegana
****************************/
function GetCoreSound(str) {
var soundMapT = { //toba
"A":"ᯀ", "E":"ᯀᯩ", "I":"ᯤ", "O":"ᯀᯬ", "U":"ᯥ", "X":"ᯃ",
"a":"ᯀ", "e":"ᯀᯩ", "i":"ᯀᯪ", "o":"ᯀᯬ", "u":"ᯀᯮ", "x":"ᯃ",
"B":"ᯅ", "C":"ᯡ", "D":"ᯑ", "G":"ᯏ", "H":"ᯃ", "J":"ᯐ", "Z":"ᯐ", "K":"ᯃ", "Q":"ᯃ", "L":"ᯟ",
"M":"ᯕ", "N":"ᯉ", "P":"ᯈ", "F":"ᯈ", "R":"ᯓ", "S":"ᯙ", "T":"ᯖ", "V":"ᯌ", "W":"ᯌ", "Y":"ᯜ",
"b":"ᯅ", "c":"ᯡ", "d":"ᯑ", "g":"ᯏ", "h":"ᯃ", "j":"ᯐ", "z":"ᯐ", "k":"ᯃ", "q":"ᯃ", "l":"ᯟ",
"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
}
var soundMapS = { //simalungun
"A":"ᯁ", "E":"ᯀᯩ", "I":"ᯤ", "O":"ᯀᯬ", "U":"ᯥ", "X":"ᯃ",
"a":"ᯀ", "e":"ᯀᯩ", "i":"ᯀᯪ", "o":"ᯀᯬ", "u":"ᯀᯮ", "x":"ᯃ",
"B":"ᯅ", "C":"ᯡ", "D":"ᯑ", "G":"ᯏ", "H":"ᯃ", "J":"ᯐ", "Z":"ᯐ", "K":"ᯃ", "Q":"ᯃ", "L":"ᯟ",
"M":"ᯕ", "N":"ᯉ", "P":"ᯈ", "F":"ᯈ", "R":"ᯓ", "S":"ᯙ", "T":"ᯖ", "V":"ᯌ", "W":"ᯌ", "Y":"ᯜ",
"b":"ᯅ", "c":"ᯡ", "d":"ᯑ", "g":"ᯏ", "h":"ᯃ", "j":"ᯐ", "z":"ᯐ", "k":"ᯃ", "q":"ᯃ", "l":"ᯟ",
"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
}
var soundMapK = { //karo
"A":"ᯀ", "E":"ᯀᯩ", "I":"ᯤ", "O":"ᯀᯬ", "U":"ᯥ", "X":"ᯃ",
"a":"ᯀ", "e":"ᯀᯩ", "i":"ᯀᯪ", "o":"ᯀᯬ", "u":"ᯀᯮ", "x":"ᯃ",
"B":"ᯅ", "C":"ᯡ", "D":"ᯑ", "G":"ᯏ", "H":"ᯃ", "J":"ᯐ", "Z":"ᯐ", "K":"ᯃ", "Q":"ᯃ", "L":"ᯟ",
"M":"ᯕ", "N":"ᯉ", "P":"ᯈ", "F":"ᯈ", "R":"ᯓ", "S":"ᯙ", "T":"ᯖ", "V":"ᯌ", "W":"ᯌ", "Y":"ᯜ",
"b":"ᯅ", "c":"ᯡ", "d":"ᯑ", "g":"ᯏ", "h":"ᯃ", "j":"ᯐ", "z":"ᯐ", "k":"ᯃ", "q":"ᯃ", "l":"ᯟ",
"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
}
var soundMapAM = { //angkola-mandailing
"A":"ᯀ", "E":"ᯀᯩ", "I":"ᯤ", "O":"ᯀᯬ", "U":"ᯥ", "X":"ᯃ",
"a":"ᯀ", "e":"ᯀᯩ", "i":"ᯀᯪ", "o":"ᯀᯬ", "u":"ᯀᯮ", "x":"ᯃ",
"B":"ᯅ", "C":"ᯡ", "D":"ᯑ", "G":"ᯏ", "H":"ᯃ", "J":"ᯐ", "Z":"ᯐ", "K":"ᯃ", "Q":"ᯃ", "L":"ᯟ",
"M":"ᯕ", "N":"ᯉ", "P":"ᯈ", "F":"ᯈ", "R":"ᯓ", "S":"ᯙ", "T":"ᯖ", "V":"ᯌ", "W":"ᯌ", "Y":"ᯜ",
"b":"ᯅ", "c":"ᯡ", "d":"ᯑ", "g":"ᯏ", "h":"ᯃ", "j":"ᯐ", "z":"ᯐ", "k":"ᯃ", "q":"ᯃ", "l":"ᯟ",
"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
}
var soundMapPD = { //pakpak-dairi
"A":"ᯀ", "E":"ᯀᯩ", "I":"ᯤ", "O":"ᯀᯬ", "U":"ᯥ", "X":"ᯃ",
"a":"ᯀ", "e":"ᯀᯩ", "i":"ᯀᯪ", "o":"ᯀᯬ", "u":"ᯀᯮ", "x":"ᯃ",
"B":"ᯅ", "C":"ᯡ", "D":"ᯑ", "G":"ᯏ", "H":"ᯃ", "J":"ᯐ", "Z":"ᯐ", "K":"ᯃ", "Q":"ᯃ", "L":"ᯟ",
"M":"ᯕ", "N":"ᯉ", "P":"ᯈ", "F":"ᯈ", "R":"ᯓ", "S":"ᯙ", "T":"ᯖ", "V":"ᯌ", "W":"ᯌ", "Y":"ᯜ",
"b":"ᯅ", "c":"ᯡ", "d":"ᯑ", "g":"ᯏ", "h":"ᯃ", "j":"ᯐ", "z":"ᯐ", "k":"ᯃ", "q":"ᯃ", "l":"ᯟ",
"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
}
var soundMap;
var bahasa = getLanguage();
if (bahasa == "karo")
soundMap = soundMapK;
else if (bahasa == "simalungun")
soundMap = soundMapS;
else if (bahasa == "toba")
soundMap = soundMapT;
else if (bahasa == "pakpak-dairi")
soundMap = soundMapPD;
else if (bahasa == "angkola-mandailing")
soundMap = soundMapAM;
var h_shift = GetShift(str);
var core = str;
if (h_shift["CoreSound"] == null) {
if (soundMap[str.charAt(0)]) core = soundMap[str.charAt(0)];
return {
"CoreSound": core,
"len": 1
}
;
} else {
return h_shift;
}
}
/***************************
Function ResolveCharacterSound
return tanda baca, digit, vokal, maupun nglegana+pangkon
****************************/
function ResolveCharacterSound(c) {
var str = "" + c;
var len = 0;
if (isDigit(c)) {
return "" + ('' + (c - '0'));
} else if (isConsonant(str[0])) {
return "" + GetCoreSound(str).CoreSound + "᯲"; //virama pangolat
} else {
//if (isVowel(str[0])) {
return "" + GetCoreSound(str).CoreSound;
}
/**/
}
/***************************
Function GetSound
fungsi yang mentransliterasi masing-masing suku kata
****************************/
function GetSound(str) {
var len = 0;
str = SuperTrim(str);
str2 = str.toLowerCase();
if (str == null || str == "") {
return "";
}
if (str.length == 1) {
return ResolveCharacterSound(str[0]);
} else {
var core_sound = GetCoreSound(str);
//return "1"+core_sound.CoreSound+"2";
var matra = "";
var konsonan = "";
if (core_sound.len >= 1) {
matra = GetMatra(str.substring(core_sound.len)); //xeiou (pepet, taling, suku, taling tarung, wulu, dll.)
/*if () {
} else {
}*/
} else {
matra = ""; } //a/å/ɔ
/* rules for some cluster like ngg- that have different behaviour depending if it's the start of a word or not.
TODO: find more elegant solution */
if (str2.indexOf("ngg") == 0) { //ngg-
if (vowelPrev) konsonan = "ᯰᯎ";//<vowel>ngg-, e.g. tunggal
else konsonan = "ᯰᯎ";//<nonvowel>ngg-, i.e. nggambar
//for cluster longer than 4 consonants, such as "ditinggalnggambar",
//need to separate it by a space, "ditinggal nggambar" to be correct
} else if (core_sound.CoreSound == 'ᯱ' && matra == "᯲") { // wignyan
konsonan = "ᯂ"; //ha
} else if (core_sound.CoreSound == 'ᯱ' && matra != "᯲") { // wignyan
konsonan = "ᯂ"; //ha
} else if (core_sound.CoreSound == 'ᯰ' && matra == "᯲") { // cecak
konsonan = "ᯰ"; matra = "";//cecak
} else if (core_sound.CoreSound == 'ᯰ' && matra != "᯲") { // cecak
konsonan = "ᯝ"; //nga
} else {
konsonan = core_sound.CoreSound;
}
return "" + konsonan + matra;
}
}
/***************************
Function DoTransliterate
fungsi utama yang dipanggil (main function)
****************************/
function DoTransliterate(str) {
var i = 0;
var ret = "";
var pi = 0;
var vowelFlag = false;
startVowel = false;
str = SuperTrim(str);
while (i < str.length) {
if (i > 0 && isVowel(str[i]) && isVowel(str[i-1])) { //deal with words that start with multiple vocals
str = str.substring(0, i)+''+str.substring(i, str.length);
}
if ((isSpecial(str[i])) && !vowelFlag) {
//i++;
} else if ((str[i] == 'h' && vowelFlag) || (!isVowel(str[i]) && i > 0) || (str[i] == ' ') || isPunct(str[i]) || isDigit(str[i]) || ((i - pi) > 5)) {
ret += GetSound(str.substring(pi, i));
if (str[i] == ' ') { ret += ' '; }
if (isPunct(str[i])) {
ret += str[i];
pi = i + 1;
} else {
pi = i;
}
vowelFlag = false;
} else if (isVowel(str[i]) && str[i] != 'h') {
//ret += GetSound(str.substring(pi, i));
vowelFlag = true;
}
if (pi > 0 && isVowel(str[pi-1])) {
//<vowel>ngg
vowelPrev = true;
} else vowelPrev = false;
i++;
}
//endwhile
if (pi < i) {
ret += GetSound(str.substring(pi, i));
}
return SuperTrim(ret);
}