[sword-svn] r256 - trunk/source/data/translit/crosswire
chrislit at crosswire.org
chrislit at crosswire.org
Thu Feb 6 01:26:30 MST 2014
Author: chrislit
Date: 2014-02-06 01:26:30 -0700 (Thu, 06 Feb 2014)
New Revision: 256
Modified:
trunk/source/data/translit/crosswire/Greek_Latin_Beta.txt
Log:
updated, checked, tested Greek/Beta transliterator
Modified: trunk/source/data/translit/crosswire/Greek_Latin_Beta.txt
===================================================================
--- trunk/source/data/translit/crosswire/Greek_Latin_Beta.txt 2014-02-06 07:46:55 UTC (rev 255)
+++ trunk/source/data/translit/crosswire/Greek_Latin_Beta.txt 2014-02-06 08:26:30 UTC (rev 256)
@@ -1,6 +1,6 @@
# ***************************************************************************
# *
-# * Copyright (C) 2002-2013, CrossWire Bible Society
+# * Copyright (C) 2002-2014, CrossWire Bible Society
# * All Rights Reserved.
# *
# ***************************************************************************
@@ -9,39 +9,55 @@
# Based on Beta code for CCAT/CATSS/TLG:
# http://ccat.sas.upenn.edu/gopher/text/religion/biblical/0-betacode.txt
+# and:
+# http://www.tlg.uci.edu/encoding/BCM2013.pdf
+
# Greek-Latin/Beta
+:: [[:Greek:][̓ʼ᾽᾿̔ʽ῞´ˊ΄´͂̂\^ˆ῀̀\`ˋ`̈¨ͅιͺ̣··;’‐—]];
:: NFD (NFC);
-:: [:Greek:] upper();
-# Uppercase
-Α<>'*A';
-Β<>'*B';
-Γ<>'*G';
-Δ<>'*D';
-Ε<>'*E';
-Ζ<>'*Z';
-Η<>'*H';
-Θ<>'*Q';
-Ι<>'*I';
-Κ<>'*K';
-Λ<>'*L';
-Μ<>'*M';
-Ν<>'*N';
-Ξ<>'*C';
-Ο<>'*O';
-Φ<>'*F';
-Ψ<>'*Y';
-Π<>'*P';
-Ρ<>'*R';
-Σ<>'*S';
-Τ<>'*T';
-Υ<>'*U';
-Χ<>'*X';
-Ω<>'*W';
-# Archaic
-Ϝ<>'*V';
-Ϟ<>'*#3';
-Ϡ<>'*#5';
-# Lowercase
+
+$betaMarks = [|():/=\\+_];
+
+|\*$2$1<\*($betaMarks)([A-Z]);
+|$2$1<[A-Z]{($betaMarks)([A-Z]);
+
+# Letters
+# Uppercase
+Α<>\*A;
+Β<>\*B;
+Γ<>\*G;
+Δ<>\*D;
+Ε<>\*E;
+Ζ<>\*Z;
+Η<>\*H;
+Θ<>\*Q;
+Ι<>\*I;
+Κ<>\*K;
+Λ<>\*L;
+Μ<>\*M;
+Ν<>\*N;
+Ξ<>\*C;
+Ο<>\*O;
+Φ<>\*F;
+Ψ<>\*Y;
+Π<>\*P;
+Ρ<>\*R;
+Ϲ<>\*S3;
+Σ<\*S1;
+Σ<\*S2;
+Σ<\*J;
+Σ<>\*S;
+Τ<>\*T;
+Υ<>\*U;
+Χ<>\*X;
+Ω<>\*W;
+
+# Uppercase Archaic
+Ϝ<>\*V;
+Ϟ<>\*\#3;
+Ϡ<>\*\#5;
+
+# Lowercase
α<>A;
β<>B;
γ<>G;
@@ -61,37 +77,75 @@
ψ<>Y;
π<>P;
ρ<>R;
-ς<>J;
+ϲ<S3;
+ς<S2;
+ς<J;
+ς>S;
+σ<S1;
+ς<S}[^[:L:][:M:]];
σ<>S;
τ<>T;
υ<>U;
χ<>X;
ω<>W;
-# Archaic
+
+# Lowercase Archaic
ϝ<>V;
-ϟ<>'#3';
-ϡ<>'#5';
+ϟ<>\#3;
+ϡ<>\#5;
+
# Non-letter characters
-ͅ<>'|';
-ͺ>'|';
-̔<>'(';
-ʽ>'(';
-·<>':';
-̓<>')';
-ʼ>')';
-́<>'/';
-´>'/';
-ˊ>'/';
-΄>'/';
-͂<>'=';
-̂>'=';
-'^'>'=';
-ˆ>'=';
-̀<>'\\';
-'`'>'\\';
-ˋ>'\\';
-̈<>'+';
-¨>'+';
-̄<>'_'; # Perseus LSJ uses _ for long vowels
+# smooth breathing
+̓<>\);
+ʼ>\);
+᾽>\);
+᾿>\);
+# rough breathing
+̔<>\(;
+ʽ>\(;
+῾>\(;
+# accent acute
+́<>\/;
+´>\/;
+ˊ>\/;
+΄>\/;
+´>\/;
+# circumflex
+͂<>\=;
+̂>\=;
+\^>\=;
+ˆ>\=;
+῀>\=;
+# accent grave
+̀<>\\;
+\`>\\;
+ˋ>\\;
+`>\\;
+# diaeresis
+̈<>\+;
+¨>\+;
+# iota subscript
+ͅ<>\|;
+ι>\|;
+ͺ>\|;
+# dot below
+̣<\?;
+
+# ignore period & comma
+
+# middle dot
+·<>\:;
+·>\:;
+# semicolon (question mark) -- use a semicolon in both scripts
+;>\;;
+# apostrophe
+’<>\';
+# hyphen
+‐<>\-;
+—<>\_;
+
+# ̄<>\_; # Perseus LSJ uses _ for long vowels
+
:: ([a-z] upper);
:: NFC (NFD);
+:: ([\*A-Za-z\#%0-9\)\(\/\=\\\+\|\?\:\;\'\-\_]);
More information about the sword-cvs
mailing list