Naraguna:Bennylin/trans-batak.js: Béda antara owahan

Saka Wikipédia Jawa, bauwarna mardika basa Jawa
Konten dihapus Konten ditambahkan
Tanpa ringkesan besutan
Tanpa ringkesan besutan
Larik 60: Larik 60:


function getLanguage() {
function getLanguage() {
var matramap, bahasa;
var bahasa;
var modeTranslit = document.getElementsByName("bahasa");
var modeTranslit = document.getElementsByName("bahasa");
for(var rad in modeTranslit) {
for(var rad in modeTranslit) {
Larik 100: Larik 100:
"A":'ᯀ', "E":'ᯀᯩ', "I":'ᯤ', "O":'ᯀᯭ', "U":'ᯥ', "X":'ᯀᯧ'
"A":'ᯀ', "E":'ᯀᯩ', "I":'ᯤ', "O":'ᯀᯭ', "U":'ᯥ', "X":'ᯀᯧ'
}
}
var matramap;
var bahasa = getLanguage();
var bahasa = getLanguage();
if (bahasa == "karo")
if (bahasa == "karo")
Larik 198: Larik 199:
"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
}
}
var soundMap;
var bahasa = getLanguage();
var bahasa = getLanguage();
if (bahasa == "karo")
if (bahasa == "karo")
matramap = matramapK;
soundMap = soundMapK;
else if (bahasa == "simalungun")
else if (bahasa == "simalungun")
matramap = matramapS;
soundMap = soundMapS;
else if (bahasa == "toba")
else if (bahasa == "toba")
matramap = matramapT;
soundMap = soundMapT;
else if (bahasa == "pakpak-dairi")
else if (bahasa == "pakpak-dairi")
matramap = matramapPD;
soundMap = soundMapPD;
else if (bahasa == "angkola-mandailing")
else if (bahasa == "angkola-mandailing")
matramap = matramapAM;
soundMap = soundMapAM;


var h_shift = GetShift(str);
var h_shift = GetShift(str);

Révisi kala 2 April 2021 14.49

/*!
* trans.js
* https://bennylin.github.com/transliterasi/batak.html
*
* Copyright 2013-2021, Bennylin @bennylin
* Dual licensed under the MIT or GPL Version 2 licenses.
* Released under the MIT, BSD, and GPL Licenses.
*
* Versions:
* 1 April 2021 - v 1.0
* TODO: tompi, bindu, u_1bef, -ou simalungun
*
* Derived from my Javanese transliteration: https://jv.wikipedia.org/wiki/Naraguna:Bennylin/trans.js
*/
var vowelPrev = false;
/***************************
Function SuperTrim, findstr
trim string, menemukan karakter di dalam string
****************************/
function SuperTrim(str) {
	str = str || '';
	return str.replace(/^\s*|\s*$/g,'').replace(/\s+/g,' ');
}
function findstr(str,tofind) {
	for (var i = 0; i < str.length; i++)
	if (str[i] == tofind)
	return true;
	return false;
}
/***************************
Function isDigit, isPunct, isVowel
cek apakah digit, tanda baca, atau huruf vokal (a, e/è/é, i, o, u, ě/ê, ô, ā/ī/ū/ō)
****************************/
function isDigit(a) {
	var str = "0123456789";
	return findstr(str,a);
}
function isPunct(a) {
	var str = ",.><?/+=-_}{[]*&^%$#@!~`\"\\|:;()";
	return findstr(str,a);
}
function isVowel(a) {
	var str = "AaEeÈèÉéIiOoUuÊêĚěXxôāīūō";
	return findstr(str,a);
}
function isConsonant(a) {
	var str = "BCDfGHJKLMNPQRSTVWXYZbcdfghjklmnpqrstvwxyz";
	//QXqx are special chars, add engma & enye
	return findstr(str,a);
}
/***************************
Function isSpecial, isHR, isLW
cek apakah karakter spesial (bikonsonan)
****************************/
function isSpecial(a) {
	var str = "GgYyDdBb";
	//untuk bikonsonan nga, nya, nda, mba
	return findstr(str,a);
}

function getLanguage() {
    var bahasa;
    var modeTranslit = document.getElementsByName("bahasa");
    for(var rad in modeTranslit) {
      if(modeTranslit[rad].checked)
        bahasa = modeTranslit[rad].value;
    }
    return bahasa;
}
/***************************
Function GetMatra
apabila huruf vokal, return matra (sandhangan swara)
****************************/
function GetMatra(str) {
	var i = 0;
	if (str.length < 1) {
		return "";
	}
	while (str[i] == 'h') {
		i++;
		if (i >= str.length) {
			break;
		}
	}
	if (i < str.length) {
		str = str.substring(i);
	}
    //Aksara i (ᯤ) dan u (ᯥ) hanya digunakan untuk suku kata terbuka, misal pada kata dan ina ᯤᯉ dan ulu ᯥᯞᯮ. Untuk suku kata tertutup yang diawali dengan bunyi i atau u, digunakanlah aksara a (ᯀ atau ᯁ) bersama diaktirik untuk masing-masing vokal, misal pada kata indung ᯀᯪᯉ᯲ᯑᯮᯰ dan umpama ᯀᯮᯔ᯲ᯇᯔ
    //Huruf Latin kapital I dan U menghasilkan aksara-aksara "ina ni surat"  ᯤ dan ᯥ, sementara huruf Latin kecil i dan u menghasilkan aksara-aksara "anak ni surat" ᯀᯪ dan ᯀᯮ.
	var matramapT= { //toba, pakpak, mandailing
		"e":'ᯩ', "é":'ᯩ', "i":'ᯪ', "o":'ᯬ', "u":'ᯮ', "x":'ᯧ',
		"A":'ᯀ', "E":'ᯀᯩ', "I":'ᯤ', "O":'ᯀᯬ', "U":'ᯥ', "X":'ᯀᯧ'
	} 
	var matramapS= { //simalungun
		"e":'ᯩ', "é":'ᯩ', "i":'ᯫ', "o":'ᯬ', "u":'ᯮ', "x":'ᯧ',
		"A":'ᯁ', "E":'ᯁᯩ', "I":'ᯤ', "O":'ᯁᯬ', "U":'ᯥ', "X":'ᯁᯧ'
	} 
	var matramapK= { //karo
		"e":'ᯩ', "é":'ᯩ', "i":'ᯫ', "o":'ᯭ', "u":'ᯬ', "x":'ᯧ',
		"A":'ᯀ', "E":'ᯀᯩ', "I":'ᯤ', "O":'ᯀᯭ', "U":'ᯥ', "X":'ᯀᯧ'
	}
    var matramap;
    var bahasa = getLanguage();
    if (bahasa == "karo")
      matramap = matramapK;
    else if (bahasa == "simalungun")
      matramap = matramapS;
    else //if (bahasa == "toba" || bahasa == "pakpak-dairi" || bahasa == "angkola-mandailing")
      matramap = matramapT;

	if(matramap[str]!==undefined) {
		return matramap[str];
	}
	return "";
}
/***************************
Function GetShift
apabila huruf bikonsonan, return karakter khusus
****************************/
function GetShift(str) {
	str = str.toLowerCase();
	if (str.indexOf("ng") == 0) {
		//suku kata diawali 'ng'
      if (str.indexOf("nga") == 0) {
        return { "CoreSound": "" + "ᯝ", "len": 3 };
      } else if (str.indexOf("nge") == 0) {
        return { "CoreSound": "" + "ᯝᯩ", "len": 3 };
      } else if (str.indexOf("ngi") == 0) {
        return { "CoreSound": "" + "ᯝᯫ", "len": 3 };
      } else if (str.indexOf("ngo") == 0) {
        return { "CoreSound": "" + "ᯝᯬ", "len": 3 };
      } else if (str.indexOf("ngu") == 0) {
        return { "CoreSound": "" + "ᯝᯮ", "len": 3 };
      } else {
		return { "CoreSound": "ᯰ", "len": 2 }; //amisara (sandhangan / cecak)
      }
	} 
	//nya
	if (str.indexOf("ny") == 0) {
		//suku kata diawali 'ny'
		return { "CoreSound": "ᯠ", "len": 2 };
	} /*
	if (str.indexOf("nd") == 0) {
		//nd-
		return { "CoreSound": "ᯢ", "len": 2 };
	} *//*
	if (str.indexOf("mb") == 0) {
		//mb-
		return { "CoreSound": "ᯣ", "len": 2 };
	} */
	return {
		"CoreSound": null, "len": 1
	}
	;
}
/***************************
Function GetCoreSound
return aksara nglegana
****************************/
function GetCoreSound(str) {
	var soundMapT = { //toba
		"A":"ᯀ", "E":"ᯀᯩ", "I":"ᯤ", "O":"ᯀᯬ", "U":"ᯥ", "X":"ᯃ", 
		"a":"ᯀ", "e":"ᯀᯩ", "i":"ᯀᯪ", "o":"ᯀᯬ", "u":"ᯀᯮ", "x":"ᯃ", 
		"B":"ᯅ", "C":"ᯡ", "D":"ᯑ", "G":"ᯏ", "H":"ᯃ", "J":"ᯐ", "Z":"ᯐ", "K":"ᯃ", "Q":"ᯃ", "L":"ᯟ", 
		"M":"ᯕ", "N":"ᯉ", "P":"ᯈ", "F":"ᯈ", "R":"ᯓ", "S":"ᯙ", "T":"ᯖ", "V":"ᯌ", "W":"ᯌ", "Y":"ᯜ", 
		"b":"ᯅ", "c":"ᯡ", "d":"ᯑ", "g":"ᯏ", "h":"ᯃ", "j":"ᯐ", "z":"ᯐ", "k":"ᯃ", "q":"ᯃ", "l":"ᯟ",
		"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
	}
	var soundMapS = { //simalungun
		"A":"ᯁ", "E":"ᯀᯩ", "I":"ᯤ", "O":"ᯀᯬ", "U":"ᯥ", "X":"ᯃ", 
		"a":"ᯀ", "e":"ᯀᯩ", "i":"ᯀᯪ", "o":"ᯀᯬ", "u":"ᯀᯮ", "x":"ᯃ", 
		"B":"ᯅ", "C":"ᯡ", "D":"ᯑ", "G":"ᯏ", "H":"ᯃ", "J":"ᯐ", "Z":"ᯐ", "K":"ᯃ", "Q":"ᯃ", "L":"ᯟ", 
		"M":"ᯕ", "N":"ᯉ", "P":"ᯈ", "F":"ᯈ", "R":"ᯓ", "S":"ᯙ", "T":"ᯖ", "V":"ᯌ", "W":"ᯌ", "Y":"ᯜ", 
		"b":"ᯅ", "c":"ᯡ", "d":"ᯑ", "g":"ᯏ", "h":"ᯃ", "j":"ᯐ", "z":"ᯐ", "k":"ᯃ", "q":"ᯃ", "l":"ᯟ",
		"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
	}
	var soundMapK = { //karo
		"A":"ᯀ", "E":"ᯀᯩ", "I":"ᯤ", "O":"ᯀᯬ", "U":"ᯥ", "X":"ᯃ", 
		"a":"ᯀ", "e":"ᯀᯩ", "i":"ᯀᯪ", "o":"ᯀᯬ", "u":"ᯀᯮ", "x":"ᯃ", 
		"B":"ᯅ", "C":"ᯡ", "D":"ᯑ", "G":"ᯏ", "H":"ᯃ", "J":"ᯐ", "Z":"ᯐ", "K":"ᯃ", "Q":"ᯃ", "L":"ᯟ", 
		"M":"ᯕ", "N":"ᯉ", "P":"ᯈ", "F":"ᯈ", "R":"ᯓ", "S":"ᯙ", "T":"ᯖ", "V":"ᯌ", "W":"ᯌ", "Y":"ᯜ", 
		"b":"ᯅ", "c":"ᯡ", "d":"ᯑ", "g":"ᯏ", "h":"ᯃ", "j":"ᯐ", "z":"ᯐ", "k":"ᯃ", "q":"ᯃ", "l":"ᯟ",
		"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
	}
	var soundMapAM = { //angkola-mandailing
		"A":"ᯀ", "E":"ᯀᯩ", "I":"ᯤ", "O":"ᯀᯬ", "U":"ᯥ", "X":"ᯃ", 
		"a":"ᯀ", "e":"ᯀᯩ", "i":"ᯀᯪ", "o":"ᯀᯬ", "u":"ᯀᯮ", "x":"ᯃ", 
		"B":"ᯅ", "C":"ᯡ", "D":"ᯑ", "G":"ᯏ", "H":"ᯃ", "J":"ᯐ", "Z":"ᯐ", "K":"ᯃ", "Q":"ᯃ", "L":"ᯟ", 
		"M":"ᯕ", "N":"ᯉ", "P":"ᯈ", "F":"ᯈ", "R":"ᯓ", "S":"ᯙ", "T":"ᯖ", "V":"ᯌ", "W":"ᯌ", "Y":"ᯜ", 
		"b":"ᯅ", "c":"ᯡ", "d":"ᯑ", "g":"ᯏ", "h":"ᯃ", "j":"ᯐ", "z":"ᯐ", "k":"ᯃ", "q":"ᯃ", "l":"ᯟ",
		"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
	}
	var soundMapPD = { //pakpak-dairi
		"A":"ᯀ", "E":"ᯀᯩ", "I":"ᯤ", "O":"ᯀᯬ", "U":"ᯥ", "X":"ᯃ", 
		"a":"ᯀ", "e":"ᯀᯩ", "i":"ᯀᯪ", "o":"ᯀᯬ", "u":"ᯀᯮ", "x":"ᯃ", 
		"B":"ᯅ", "C":"ᯡ", "D":"ᯑ", "G":"ᯏ", "H":"ᯃ", "J":"ᯐ", "Z":"ᯐ", "K":"ᯃ", "Q":"ᯃ", "L":"ᯟ", 
		"M":"ᯕ", "N":"ᯉ", "P":"ᯈ", "F":"ᯈ", "R":"ᯓ", "S":"ᯙ", "T":"ᯖ", "V":"ᯌ", "W":"ᯌ", "Y":"ᯜ", 
		"b":"ᯅ", "c":"ᯡ", "d":"ᯑ", "g":"ᯏ", "h":"ᯃ", "j":"ᯐ", "z":"ᯐ", "k":"ᯃ", "q":"ᯃ", "l":"ᯟ",
		"m":"ᯕ", "n":"ᯉ", "p":"ᯈ", "f":"ᯈ", "r":"ᯓ", "s":"ᯙ", "t":"ᯖ", "v":"ᯌ", "w":"ᯌ", "y":"ᯜ"
	}
    var soundMap;
    var bahasa = getLanguage();
    if (bahasa == "karo")
      soundMap = soundMapK;
    else if (bahasa == "simalungun")
      soundMap = soundMapS;
    else if (bahasa == "toba")
      soundMap = soundMapT;
    else if (bahasa == "pakpak-dairi")
      soundMap = soundMapPD;
    else if (bahasa == "angkola-mandailing")
      soundMap = soundMapAM;

	var h_shift = GetShift(str);
	var core = str;
	if (h_shift["CoreSound"] == null) {
		if (soundMap[str.charAt(0)]) core = soundMap[str.charAt(0)];
		return {
			"CoreSound": core,
			"len": 1
		}
		;
	} else {
		return h_shift;
	}
}
/***************************
Function ResolveCharacterSound
return tanda baca, digit, vokal, maupun nglegana+pangkon
****************************/
function ResolveCharacterSound(c) {
	var str = "" + c;
	var len = 0;
	if (isDigit(c)) {
		return "" + ('' + (c - '0'));
	} else if (isConsonant(str[0])) {
		return "" + GetCoreSound(str).CoreSound + "᯲"; //virama pangolat
	} else {
		//if (isVowel(str[0])) {
		return "" + GetCoreSound(str).CoreSound;
	}
	/**/
}
/***************************
Function GetSound
fungsi yang mentransliterasi masing-masing suku kata
****************************/
function GetSound(str) {

    var len = 0;
    str = SuperTrim(str);
    str2 = str.toLowerCase();
    if (str == null || str == "") {
        return "";
    }
    if (str.length == 1) {
        return ResolveCharacterSound(str[0]);
    } else {
        var core_sound = GetCoreSound(str);
        //return "1"+core_sound.CoreSound+"2";
        var matra = "";
        var konsonan = "";
            if (core_sound.len >= 1) {
                matra = GetMatra(str.substring(core_sound.len)); //xeiou (pepet, taling, suku, taling tarung, wulu, dll.)
                /*if () {

                } else {

                }*/
            } else {
                matra = ""; } //a/å/ɔ

/* rules for some cluster like ngg- that have different behaviour depending if it's the start of a word or not.
TODO: find more elegant solution */
        if (str2.indexOf("ngg") == 0) { //ngg-
            if (vowelPrev) konsonan = "ᯰᯎ";//<vowel>ngg-, e.g. tunggal
            else konsonan = "ᯰᯎ";//<nonvowel>ngg-, i.e. nggambar
            //for cluster longer than 4 consonants, such as "ditinggalnggambar",
            //need to separate it by a space, "ditinggal nggambar" to be correct

        } else if (core_sound.CoreSound == 'ᯱ' && matra == "᯲") { // wignyan
            konsonan = "ᯂ"; //ha
        } else if (core_sound.CoreSound == 'ᯱ' && matra != "᯲") { // wignyan
            konsonan = "ᯂ"; //ha
        } else if (core_sound.CoreSound == 'ᯰ​' && matra == "᯲") { // cecak
            konsonan = "ᯰ​"; matra = "";//cecak
        } else if (core_sound.CoreSound == 'ᯰ​' && matra != "᯲") { // cecak
            konsonan = "ᯝ"; //nga
        } else {
            konsonan = core_sound.CoreSound;
        }
        return "" + konsonan + matra;
    }
}
/***************************
Function DoTransliterate
fungsi utama yang dipanggil (main function)
****************************/
function DoTransliterate(str) {
	var i = 0;
	var ret = "";
	var pi = 0;
	var vowelFlag = false;
	startVowel = false;
	str = SuperTrim(str);
	while (i < str.length) {

        if (i > 0 && isVowel(str[i]) && isVowel(str[i-1])) { //deal with words that start with multiple vocals
               str = str.substring(0, i)+'​'+str.substring(i, str.length);
        }
		if ((isSpecial(str[i])) && !vowelFlag) {
			//i++;
		} else if ((str[i] == 'h' && vowelFlag) || (!isVowel(str[i]) && i > 0) || (str[i] == ' ') || isPunct(str[i]) || isDigit(str[i]) || ((i - pi) > 5)) {
			ret += GetSound(str.substring(pi, i));
            if (str[i] == ' ') { ret += ' '; }
			if (isPunct(str[i])) {
					ret += str[i];
					pi = i + 1;
			} else {
				pi = i;
			}
			vowelFlag = false;
		} else if (isVowel(str[i]) && str[i] != 'h') {
			//ret += GetSound(str.substring(pi, i));
			vowelFlag = true;
		}
		if (pi > 0 && isVowel(str[pi-1])) {
			//<vowel>ngg
			vowelPrev = true;
		} else vowelPrev = false;
		i++;
	}
	//endwhile
	if (pi < i) {
		ret += GetSound(str.substring(pi, i));
	}
	return SuperTrim(ret);
}