TengwarTranslator/src/net/agspace/translate/Translator.java

609 lines
23 KiB
Java
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

package net.agspace.translate;
import java.util.*;
/**
* Created by Andrew's Computer on 23-Apr-17.
*/
public class Translator {
//Consonant variables.
private static final char B = 'w';
private static final char C = 'c';
private static final char D = '2';
private static final char F = 'e';
private static final char G = 'x';
private static final char H = '9';
private static final char J = 's';
private static final char K = 'z';
private static final char L = 'j';
private static final char M = 't';
private static final char N = '5';
private static final char P = 'q';
private static final char Q = 'n';
private static final char R = '6';
private static final char S = '8';
private static final char T = '1';
private static final char V = 'r';
private static final char W = 'y';
private static final char X = '¦';
private static final char Y = 'h';
private static final char Z = 'k';
//Compound chars.
private static final char TH = '3';
private static final char CH = 'a';
private static final char SH = 'd';
private static final char ZH = 'f';
private static final char GH = 'v';
private static final char WH = 'o';
private static final char CK = 'Z';
private static final char NY = 'g';
private static final char NG = 'b';
private static final char RD = 'u';
private static final char LD = 'm';
//Vowels.
private static final char A_1 = '#';
private static final char A_2 = 'E';
private static final char A_3 = 'D';
private static final char A_4 = 'C';
private static final char E_1 = '$';
private static final char E_2 = 'R';
private static final char E_3 = 'F';
private static final char E_4 = 'V';
private static final char E_UNDER_1 = 'È';
private static final char E_UNDER_2 = 'É';
private static final char E_UNDER_3 = 'Ê';
private static final char E_UNDER_4 = 'Ë';
private static final char E_LAMBE = 'L';
private static final char I_1 = '%';
private static final char I_2 = 'T';
private static final char I_3 = 'G';
private static final char I_4 = 'B';
private static final char O_1 = '^';
private static final char O_2 = 'Y';
private static final char O_3 = 'H';
private static final char O_4 = 'N';
private static final char U_1 = '&';
private static final char U_2 = 'U';
private static final char U_3 = 'J';
private static final char U_4 = 'M';
//Carriers.
private static final char CARRIER_LONG = '~';
private static final char CARRIER_SHORT = '`';
//Numbers.
private static final char NUMBER_0 = 'ð';
private static final char NUMBER_1 = 'ñ';
private static final char NUMBER_2 = 'ò';
private static final char NUMBER_3 = 'ó';
private static final char NUMBER_4 = 'ô';
private static final char NUMBER_5 = 'õ';
private static final char NUMBER_6 = 'ö';
private static final char NUMBER_7 = '÷';
private static final char NUMBER_8 = 'ø';
private static final char NUMBER_9 = 'ù';
//Punctuation
private static final char PERIOD = '-';
private static final char COMMA = '=';
private static final char EXCLAMATION = 'Á';
private static final char QUESTION = 'À';
private static final char SEMICOLON = 'Ã';
private static final char COLON = 'ˆ';
private static final char PARENTHESES_RIGHT = 'œ';
private static final char PARENTHESES_LEFT = 'Œ';
private static final char QUOTE = '«';
private static final char APOSTROPHE = '±';
private static final char SPACE = ' ';
private static final char EQUALS = '¬';
private static final char MINUS = '\\';
private static final char NEWLINE = '\n';
//Doubles Bars
private static final char BAR_SHORT_TOP = '[';
private static final char BAR_SHORT_BOTTOM = '\'';
private static final char BAR_LONG_TOP = '{';
private static final char BAR_LONG_BOTTOM = '"';
//Alternate forms.
private static final char S_ALT = 'i';
private static final char Z_ALT = ',';
private static final char W_ALT = '.';
private static final char R_ALT = '7';
private static final char Y_ALT = 'l';
//S-Curls
private static final char S_CURL_1 = '+';
private static final char S_CURL_2 = '_';
private static final char S_CURL_3 = '¢';
//Mappings of english chars to tengwars.
private static final Map<Character, Character> consonantChars = new HashMap<>();
static {
consonantChars.put('b', B);
consonantChars.put('c', C);
consonantChars.put('d', D);
consonantChars.put('f', F);
consonantChars.put('g', G);
consonantChars.put('h', H);
consonantChars.put('j', J);
consonantChars.put('k', K);
consonantChars.put('l', L);
consonantChars.put('m', M);
consonantChars.put('n', N);
consonantChars.put('p', P);
consonantChars.put('q', Q);
consonantChars.put('r', R);
consonantChars.put('s', S);
consonantChars.put('t', T);
consonantChars.put('v', V);
consonantChars.put('w', W);
consonantChars.put('x', X);
consonantChars.put('y', Y);
consonantChars.put('z', Z);
}
//Mapping for compound chars.
private static final Map<String, Character> compoundChars = new HashMap<>();
static {
compoundChars.put("th", TH);
compoundChars.put("ch", CH);
compoundChars.put("sh", SH);
compoundChars.put("zh", ZH);
compoundChars.put("gh", GH);
compoundChars.put("wh", WH);
compoundChars.put("ck", CK);
compoundChars.put("ny", NY);
compoundChars.put("ng", NG);
compoundChars.put("rd", RD);
compoundChars.put("ld", LD);
}
//Mapping consonants to alternates.
private static final Map<Character, Character> alternateChars = new HashMap<>();
static {
alternateChars.put('s', S_ALT);
alternateChars.put('z', Z_ALT);
alternateChars.put('w', W_ALT);
alternateChars.put('y', Y_ALT);
}
//Mapping for numbers. No vowel size needed.
private static final Map<Character, Character> numberChars = new HashMap<>();
static {
numberChars.put('0', NUMBER_0);
numberChars.put('1', NUMBER_1);
numberChars.put('2', NUMBER_2);
numberChars.put('3', NUMBER_3);
numberChars.put('4', NUMBER_4);
numberChars.put('5', NUMBER_5);
numberChars.put('6', NUMBER_6);
numberChars.put('7', NUMBER_7);
numberChars.put('8', NUMBER_8);
numberChars.put('9', NUMBER_9);
}
//Mapping for punctuation. No vowel size needed.
private static final Map<Character, Character> punctuationChars = new HashMap<>();
static {
punctuationChars.put('.', PERIOD);
punctuationChars.put(',', COMMA);
punctuationChars.put('!', EXCLAMATION);
punctuationChars.put('?', QUESTION);
punctuationChars.put(';', SEMICOLON);
punctuationChars.put(':', COLON);
punctuationChars.put(')', PARENTHESES_RIGHT);
punctuationChars.put('(', PARENTHESES_LEFT);
punctuationChars.put('"', QUOTE);
punctuationChars.put('\'', APOSTROPHE);
punctuationChars.put(' ', SPACE);
punctuationChars.put('=', EQUALS);
punctuationChars.put('-', MINUS);
punctuationChars.put('\n', NEWLINE);
}
//Mapping for vowels. Each value is an array, with A_1 to A_4 in indices 0 - 3.
private static final Map<Character, Character[]> vowelChars = new HashMap<>();
static {
vowelChars.put('a', new Character[]{A_1, A_2, A_3, A_4});
vowelChars.put('e', new Character[]{E_1, E_2, E_3, E_4, E_UNDER_1, E_UNDER_2, E_UNDER_3, E_UNDER_4});
vowelChars.put('i', new Character[]{I_1, I_2, I_3, I_4});
vowelChars.put('o', new Character[]{O_1, O_2, O_3, O_4});
vowelChars.put('u', new Character[]{U_1, U_2, U_3, U_4});
}
//For the characters which allow a vowel above them, this tells which vowel type to use.
private static final Map<Character, Integer> charSizes = new HashMap<>();
static {
charSizes.put(B, 1);
charSizes.put(C, 2);
charSizes.put(D, 1);
charSizes.put(F, 3);
charSizes.put(G, 1);
charSizes.put(H, 3);
charSizes.put(J, 1);
charSizes.put(K, 2);
charSizes.put(L, 1);
charSizes.put(M, 1);
charSizes.put(N, 1);
charSizes.put(P, 2);
charSizes.put(Q, 2);
charSizes.put(R, 2);
charSizes.put(S, 1);
charSizes.put(T, 2);
charSizes.put(V, 1);
charSizes.put(W, 2);
charSizes.put(X, 1);
charSizes.put(Y, 2);
charSizes.put(Z, 1);
charSizes.put(S_ALT, 2);
charSizes.put(Z_ALT, 2);
charSizes.put(W_ALT, 2);
charSizes.put(R_ALT, 2);
charSizes.put(Y_ALT, 2);
charSizes.put(TH, 3);
charSizes.put(CH, 2);
charSizes.put(SH, 2);
charSizes.put(ZH, 1);
charSizes.put(GH, 1);
charSizes.put(WH, 1);
charSizes.put(CK, 1);
charSizes.put(NY, 1);
charSizes.put(NG, 1);
charSizes.put(RD, 2);
charSizes.put(LD, 1);
charSizes.put(CARRIER_LONG, 4);
charSizes.put(CARRIER_SHORT, 4);
}
//Sets bar preferences, 0 for long top, 1 for long bottom, 2 for short top, 3 for short bottom.
private static final Map<Character, Integer> barSizes = new HashMap<>();
static {
barSizes.put(B, 0);
barSizes.put(C, 2);
barSizes.put(D, 1);
barSizes.put(F, 2);
barSizes.put(G, 1);
barSizes.put(H, 1);
barSizes.put(J, 0);
barSizes.put(K, 2);
barSizes.put(L, 1);
barSizes.put(M, 0);
barSizes.put(N, 0);
barSizes.put(P, 3);
barSizes.put(Q, 3);
barSizes.put(R, 2);
barSizes.put(S, 1);
barSizes.put(T, 3);
barSizes.put(V, 0);
barSizes.put(W, 2);
barSizes.put(X, 0);
barSizes.put(Y, 2);
barSizes.put(Z, 1);
barSizes.put(S_ALT, 0);
barSizes.put(Z_ALT, 1);
barSizes.put(W_ALT, 2);
barSizes.put(R_ALT, 2);
barSizes.put(Y_ALT, 2);
}
//List of s-curls.
private static final List<Character> sCurls = new ArrayList<>();
static{
sCurls.add(S_CURL_1);
sCurls.add(S_CURL_2);
sCurls.add(S_CURL_3);
}
//List of carriers.
private static final List<Character> carriers = new ArrayList<>();
static {
carriers.add(CARRIER_LONG);
carriers.add(CARRIER_SHORT);
}
//List of bars.
private static final List<Character> bars = new ArrayList<>();
static {
bars.add(BAR_LONG_TOP);
bars.add(BAR_LONG_BOTTOM);
bars.add(BAR_SHORT_TOP);
bars.add(BAR_SHORT_BOTTOM);
}
/**
* Gives the properly sized vowel for a particular tengwar character.
* Uses indices from the charSizes map to find the proper character.
* @param tengwarChar tengwar char to be checked.
* @param englishVowel the english vowel type to be returned.
* @return tengwar vowel char corresponding to the letter, or default of left-most.
*/
private static char getAppropriateVowel(char tengwarChar, char englishVowel){
if (charSizes.containsKey(tengwarChar)){
return vowelChars.get(englishVowel)[charSizes.get(tengwarChar)-1];
} else {
return vowelChars.get(englishVowel)[0];
}
}
/**
* Gives the properly sized silent e vowel for a particular character.
* @param tengwarChar tengwar char to be checked.
* @return silent e vowel corresponding to the letter, or default of left-most.
*/
private static char getAppropriateSilentE(char tengwarChar){
if (tengwarChar == L){
return E_LAMBE;
}
if (charSizes.containsKey(tengwarChar)){
return vowelChars.get('e')[charSizes.get(tengwarChar)+3];
} else {
return vowelChars.get('e')[4];
}
}
/**
* Determines if a character is a vowel.
* @param c english character.
* @return true if vowel, false if not.
*/
private static boolean isVowel(char c){
return (c == 'a' || c == 'e' || c == 'i' || c == 'o' || c == 'u');
}
/**
* Determines if a tengwar character is a vowel.
* @param c tengwar char to check.
* @return true if vowel, false if not.
*/
private static boolean isVowelTengwar(char c){
for (Character[] ch : vowelChars.values()){
for (char cha : ch){
if (cha == c)
return true;
}
}
return false;
}
/**
* Returns the english vowel representation of a tengwar vowel.
* @param tengwarVowel The tengwar vowel to decipher.
* @return english vowel char.
*/
private static char getEnglishVowel(char tengwarVowel){
if (!isVowelTengwar(tengwarVowel)){
return 0;
}
for (Character[] ch : vowelChars.values()){
for (char cha : ch){
if (cha == tengwarVowel) {
return getKeyByValue(vowelChars, ch);
}
}
}
return 0;
}
/**
* Determines if a tengwar char is a silent E.
* @param tengwarChar the tengwar char to evaluate.
* @return True if it is a silent E, false otherwise.
*/
private static boolean isSilentE(char tengwarChar){
return tengwarChar == E_UNDER_1
|| tengwarChar == E_UNDER_2
|| tengwarChar == E_UNDER_3
|| tengwarChar == E_UNDER_4
|| tengwarChar == E_LAMBE;
}
/**
* Returns a character or string that is a literal translation from tengwar.
* @param tengwarChar the tengwar char to translate.
* @return english representation of the tengwar.
*/
private static String getEnglishLiteral(char tengwarChar){
if (consonantChars.containsValue(tengwarChar)){
return getKeyByValue(consonantChars, tengwarChar).toString();
} else if (compoundChars.containsValue(tengwarChar)){
return getKeyByValue(compoundChars, tengwarChar);
} else if (alternateChars.containsValue(tengwarChar)) {
return getKeyByValue(alternateChars, tengwarChar).toString();
} else if (tengwarChar == R_ALT){
return "r";
} else if (numberChars.containsValue(tengwarChar)){
return getKeyByValue(numberChars, tengwarChar).toString();
} else if (punctuationChars.containsValue(tengwarChar)){
return getKeyByValue(punctuationChars, tengwarChar).toString();
}
return null;
}
/**
* Returns the key for a specified value in a 1 to 1 map.
* @param map The 1 to 1 map to use.
* @param value Value to return the key of.
* @param <T> Key type of the map.
* @param <E> Value type of the map.
* @return Key associated with value.
*/
private static <T, E> T getKeyByValue(Map<T, E> map, E value) {
for (Map.Entry<T, E> entry : map.entrySet()) {
if (Objects.equals(value, entry.getValue())) {
return entry.getKey();
}
}
return null;
}
/**
* Translate an english string to tengwar.
* @param englishString english string.
* @return tengwar string.
*/
public static String translateToTengwar(String englishString){
StringBuilder result = new StringBuilder(englishString.length());
String input = englishString.toLowerCase().trim();
for (int i = 0; i < input.length(); i++){
//Attempt to get previous, current, and next char.
char currentChar = input.charAt(i);
char nextChar = 0;
try{
nextChar = input.charAt(i+1);
} catch (IndexOutOfBoundsException e){
//Do nothing, since this may happen.
}
//Test if the current char is a vowel.
if (isVowel(currentChar)){
if (consonantChars.containsKey(nextChar)){
//If the next character can have a vowel placed on it, then go here.
//Temporary storage for the character that will be added before the vowel.
char tengwarCharToBeAdded;
boolean needsBar = false;
char secondNextChar = 0;
//Check if the next char is a compound first.
try{
secondNextChar = input.charAt(i+2);
} catch (IndexOutOfBoundsException e){
//Do nothing. second next char doesn't exist.
}
if (compoundChars.containsKey(""+nextChar+secondNextChar)) {
tengwarCharToBeAdded = compoundChars.get("" + nextChar + secondNextChar);
i++;
} else if (alternateChars.containsKey(nextChar)){
//Not a compound, so now check for alternates.
tengwarCharToBeAdded = alternateChars.get(nextChar);
} else if (nextChar == 'r' && isVowel(secondNextChar)){
//Special case if there is an r next, with a vowel after it.
tengwarCharToBeAdded = R_ALT;
} else {
//Finally, add a literal consonant.
tengwarCharToBeAdded = consonantChars.get(nextChar);
}
//Check to see if a bar should be added, and the next character skipped.
if (nextChar == secondNextChar){
//Bar should be added.
needsBar = true;
i++;
}
result.append(tengwarCharToBeAdded);
result.append(getAppropriateVowel(tengwarCharToBeAdded, currentChar));
//Bar gets added after the vowel.
if (needsBar)
result.append(bars.get(barSizes.get(tengwarCharToBeAdded)));
i++;
} else {
//The next character is not able to have a vowel placed on it, so use a carrier.
if (currentChar == 'e' && (i == input.length()-1 || punctuationChars.containsKey(nextChar))){
//Use a silent e because the next char is a punctuation or the end of the string.
try{
result.append(getAppropriateSilentE(result.charAt(result.length()-1)));
} catch (IndexOutOfBoundsException e){
result.append(E_UNDER_1);
}
continue;
}
if (currentChar == nextChar){
//Add a long carrier, and skip the next character, because it is the same.
result.append(CARRIER_LONG);
result.append(getAppropriateVowel(CARRIER_LONG, currentChar));
i++;
} else {
//Add a short carrier.
result.append(CARRIER_SHORT);
result.append(getAppropriateVowel(CARRIER_SHORT, currentChar));
}
}
//Done with vowel checking.
} else {
//Character is not a vowel, so consonant, compound, number, or punctuation.
if (compoundChars.containsKey(""+currentChar+nextChar)){
//current char and next char are a compound, so add it and skip the next iteration.
result.append(compoundChars.get(""+currentChar+nextChar));
i++;
} else if (isVowel(nextChar) && currentChar == 'r') {
//Special case for r vowel.
result.append(R_ALT);
} else {
//Character can be literally translated from numbers or consonants or punctuation.
if (consonantChars.containsKey(currentChar)) {
result.append(consonantChars.get(currentChar));
if (currentChar == nextChar) {
//double consonant found, add a bar.
result.append(bars.get(barSizes.get(consonantChars.get(currentChar))));
i++;
}
} else if (punctuationChars.containsKey(currentChar)) {
result.append(punctuationChars.get(currentChar));
} else if (numberChars.containsKey(currentChar)) {
result.append(numberChars.get(currentChar));
}
}
}
}
return result.toString();
}
/**
* Translates a tengwar string to english.
* @param tengwarString tengwar string.
* @return english string.
*/
public static String translateToEnglish(String tengwarString){
StringBuilder result = new StringBuilder(tengwarString.length()+tengwarString.length()/2);
for (int i = 0; i < tengwarString.length(); i++){
char currentChar = tengwarString.charAt(i);
char nextChar = 0;
char secondNextChar = 0;
try{
nextChar = tengwarString.charAt(i+1);
} catch (IndexOutOfBoundsException e){
//Do nothing, this is fine.
}
try{
secondNextChar = tengwarString.charAt(i+2);
} catch (IndexOutOfBoundsException e){
//Do nothing, this is fine.
}
String currentLiteral = getEnglishLiteral(currentChar);
System.out.println("At: "+i+" Literal: "+currentLiteral);
//Check if the current character is a literal translation.
if (currentLiteral != null){
//Check if the next character is a vowel that should be placed before a character.
if (isVowelTengwar(nextChar) && !isSilentE(nextChar)){
result.append(getEnglishVowel(nextChar));
result.append(currentLiteral);
i++;
//Check for a double-bar, and then add whatever the current char is.
if (bars.contains(secondNextChar)){
result.append(currentLiteral);
i++;
}
} else if (bars.contains(nextChar)){
result.append(currentLiteral);
i++;
} else {
//Just append the current literal, no skipping.
result.append(currentLiteral);
}
} else {
//Current character is not a literal translation, so it is an E_UNDER, or carrier.
if (carriers.contains(currentChar)){
//If carrier, append the following vowel.
result.append(getEnglishVowel(nextChar));
i++;
} else if (isSilentE(currentChar)) {
result.append('e');
}
}
}
return result.toString();
}
}