[sword-svn] r255 - trunk/source/data/translit/crosswire

chrislit at crosswire.org chrislit at crosswire.org
Thu Feb 6 00:46:55 MST 2014


Author: chrislit
Date: 2014-02-06 00:46:55 -0700 (Thu, 06 Feb 2014)
New Revision: 255

Modified:
   trunk/source/data/translit/crosswire/Any_BetaCodeExtensions.txt
Log:
fixed all rule masking


Modified: trunk/source/data/translit/crosswire/Any_BetaCodeExtensions.txt
===================================================================
--- trunk/source/data/translit/crosswire/Any_BetaCodeExtensions.txt	2014-02-06 06:10:48 UTC (rev 254)
+++ trunk/source/data/translit/crosswire/Any_BetaCodeExtensions.txt	2014-02-06 07:46:55 UTC (rev 255)
@@ -12,132 +12,10 @@
 # Any-BetaCodeExtensions
 :: NFD (NFC);
 
-# Additional Punctuation and Characters
-\;<\%100;
-\#<>\%101;
-‘<\%102;
-\\<>\%103;
-\^<>\%104;
-\|\|\|<>\%105;
-≌<>\%106;
-\~<>\%107;
-±<>\%108;
-·<\%109;
-○<>\%110;
-̯<>\%127;
-̂<>\%128;
-†<>\%129;
-̇<\%130;
-΅<>\%132;
-῍<>\%133;
-῏<>\%134;
-⏑́<>\%138;
-# %139 unencodable: idiosyn
-𐄒<>\%140;
-⏖<>\%141;
-┐<>\%142;
-⏑̶<>\%144;
-–́<>\%145;
-·<\%146;
-̊<\%147;
-̌<>\%148;
-̨<>\%149;
-\|<\%150;
-# %151-%153 unencodable: non-TLG
-∴<>\%154;
-∵<>\%155;
-⸸<>\%157;
-⁂<>\%158;
-×<>\%159;
-\-<>\%160;
-÷<>\%161;
-̸<>\%162;
-¶<>\%163;
-͙<>\%170;
-\/\/<>\%171;
-ʼ<>\%172;
-ʽ<>\%173;
-´<>\%174;
-\`<>\%175;
-῀<>\%176;
-̓<>\%177;
-̔<>\%178;
-̣<>\%179;
-̽<>\%180;
-̭<>\%181;
-͡<>\%182;
-͝<>\%183;
-͞<>\%184;
-⌙<>\%185;
-𝉂<>\%186;
-¬<>\%187;
-̚<>\%188;
+# priority mappings to avoid masking
+̣̣>\%29;
+\/\/>\%171;
 
-\:<>\%10;
-•<>\%11;
-\*<>\%12;
-‡<>\%13;
-§<>\%14;
-ˈ<>\%15;
-¦<>\%16;
-‖<>\%17;
-\'<\%18;
-–<\%19;
-́<>\%20;
-̀<>\%21;
-̂<>\%22;
-̈<>\%23;
-͂<>\%24;
-̧<>\%25;
-̄<>\%26;
-̆<>\%27;
-̈<\%28;
-̣̣<>\%29;
-ʼ<>\%30;
-ʽ<>\%31;
-´<>\%32;
-\`<>\%33;
-῀<>\%34;
-῎<>\%35;
-῞<>\%36;
-῝<>\%37;
-῟<>\%38;
-¨<>\%39;
-⏑<>\%40;
-–<>\%41;
-⏕<>\%42;
-×<>\%43;
-⏒<>\%44;
-⏓<>\%45;
-⏔<>\%46;
-𐄑<>\%47;
-# %48-%49 unencodable: markup
-# %50-%65 unencodable: non-TLG
-β̸<\%69;
-# %70-%73 unencodable: non-TLG
-# %80-%81 unencodable: markup
-҅<>\%91;
-҆<>\%92;
-᷀<>\%93;
-̇<>\%94;
-᷁<>\%95;
-͜<>\%96;
-̈<>\%97;
-\"<>\%98;
-≈<>\%99;
-
-\?<>\%1;
-\*<>\%2;
-\/<>\%3;
-\!<>\%4;
-\|<>\%5;
-\=<>\%6;
-\+<>\%7;
-\%<>\%8;
-\&<>\%9;
-
-†<>\%;
-
 # Byzantine Musical Notation
 𝀀<>\#2000;
 𝀁<>\#2001;
@@ -398,7 +276,7 @@
 #            Further Abbreviations 
 
 𐅼<\#1000;
-𐅽<>\#1001;
+𐅽<\#1001;
 𐅾<>\#1002;
 𐅿<>\#1003;
 𐆀<>\#1004;
@@ -474,7 +352,7 @@
 n̊<>\#1314;
 # #1315 unencodable: abbr
 ʒ<>\#1316;
-˙\/\/.<>\#1317;
+˙\/\/\.<>\#1317;
 ∻<\#1318;
 # #1319 unencodable: idiosyn
 ͵̑<>\#1320;
@@ -485,7 +363,7 @@
 # #1325-#1328,#1334 unencodable: idiosyn
 \/\/<\#1335;
 # #1336 unencodable: idiosyn
-\><>\#1337;
+\><\#1337;
 𐅾<\#1338;
 # #1340 unencodable: markup
 # #1341 unencodable: idiosyn
@@ -497,13 +375,13 @@
 # #1505 unencodable: abbr
 ̀̌<>\#1506;
 # #1509-#1511 unencodable: abbr
-\<<>\#1512;
-𐅵<>\#1513;
-÷<>\#1514;
+\<<\#1512;
+𐅵<\#1513;
+÷<\#1514;
 𝈏<>\#1515;
 # #1516 unencodable: idiosyn
 # #1517 unencodable: rare
-𝈩<>\#1518;
+𝈩<\#1518;
 # #1519 unencodable: idiosyn
 # #1520 unencodable: abbr
 Ȣ<>\#1521;
@@ -554,7 +432,7 @@
 𐅁<>\#801;
 𐅀<\#802;
 Χ<\#803;
-\/<>\#804;
+\/<\#804;
 Τ<\#805;
 Κ<\#806;
 𐅦<>\#807;
@@ -591,7 +469,7 @@
 \|\|<>\#840;
 ·<\#842;
 𐅛<>\#843;
-⁝<>\#844;
+⁝<\#844;
 𐅘<>\#845;
 𐄐<>\#846;
 𐅞<>\#847;
@@ -602,7 +480,7 @@
 𐅄<\#863;
 𐅅<\#865;
 Χ<\#866;
-𐅆<>\#867;
+𐅆<\#867;
 # #899 unencodable: idiosyn
 ᴨ<\#922;
 # #923-#924 unencodable: idiosyn
@@ -612,13 +490,13 @@
 𝈋<\#928;
 𝈔<\#929;
 # #930 unencodable: idiosyn
-✳<>\#932;
+✳<\#932;
 # #933-#934,#936 unencodable: idiosyn
 # #937 unencodable: non-TLG
-Ƨ<>\#938;
+Ƨ<\#938;
 \~<\#939;
 # #940 unencodable: idiosyn
-𝈅<>\#941;
+𝈅<\#941;
 # #980 unencodable: idiosyn
 
 # #400-#699
@@ -628,12 +506,12 @@
 
 Ͱ<>\*\#400;
 ͱ<>\#400;
-ʃ<>\#451;
+ʃ<\#451;
 ⸐<\#452;
 ⸑<>\#453;
 ⸐<\#454;
 ⸑<\#455;
-⸎<>\#456;
+⸎<\#456;
 # #457 unencodable: idiosyn
 Χ<\#458;
 ·<\#459;
@@ -642,7 +520,7 @@
 ☧<>\#465;
 # #466 unencodable: idiosyn
 \→<>\#467;
-⸎<>\#468;
+⸎<\#468;
 ʃ<>\#476;
 # #501 unencodable: abbr
 # #502 unencodable: idiosyn
@@ -667,7 +545,7 @@
 ⸓<>\#523;
 ⊗<>\#524;
 ✛<>\#525;
-←<>\#526;
+\←<>\#526;
 ˆ<\#527;
 λ̭<\#528;
 ⁋<>\#529;
@@ -701,7 +579,7 @@
 𝈳<>\#568;
 𝈶<>\#569;
 Ϲ<\#570;
-𐅃<>\#571;
+𐅃<\#571;
 𝈩<>\#572;
 𝈒<>\#573;
 Γ<\#574;
@@ -742,7 +620,7 @@
 𝈅<>\#621;
 𝈁<>\#622;
 ℧<\#623;
-Ͻ<>\#624;
+Ͻ<\#624;
 # #625-#626 unencodable: rare
 𝈗<>\#627;
 Ο<\#628;
@@ -767,7 +645,7 @@
 𝈬<>\#647;
 𝈵<>\#648;
 𝈋<>\#649;
-𝈏<>\#650;
+𝈻<>\#650;
 Χ<\#651;
 Τ<\#652;
 𝈙<>\#653;
@@ -840,8 +718,8 @@
 𐅽<>\#119;
 𐆄<\#120;
 ξ̸<\#121;
-𐅽<>\#122;
-𐅼<>\#123;
+𐅽<\#122;
+𐅼<\#123;
 # #124 unencodable: idiosyn
 # #125 unencodable: markup
 # #126 unencodable: idiosyn
@@ -914,7 +792,7 @@
 # #300 unencodable: rare
 # #301 unencodable: markup
 # #302 unencodable: idiosyn
-\><>\#303;
+\><\#303;
 # #304 unencodable: rare
 ⸎<\#305;
 # #306-#308 unencodable: rare
@@ -927,17 +805,17 @@
 ●<\#319;
 ☩<\#320;
 ☩<\#321;
-☧<>\#322;
-\><>\#323;
+☧<\#322;
+\><\#323;
 # #324-#337 unencodable: non-TLG
 
 Ͻ<>\#10;
 Ͽ<>\#11;
-—<>\#12;
+𝈏<\#12;
 ※<>\#13;
 ⸖<>\#14;
 \><>\#15;
-?<>\#16;
+Ͼ<>\#16;
 \/<>\#17;
 \<<>\#18;
 ̀<\#19;
@@ -967,12 +845,12 @@
 Χ<>\#67;
 𐅆<>\#68;
 Μ<\#69;
-.<\#70;
+\.<\#70;
 ·<\#71;
 ˙<>\#72;
 ⁚<>\#73;
 ⁝<>\#74;
-.<\#75;
+\.<\#75;
 ̈<\#80;
 \'<\#81;
 ˊ<\#82;
@@ -999,5 +877,132 @@
 
 ʹ<>\#;
 
-:: NFC ()
+# Additional Punctuation and Characters
+
+\;<\%100;
+\#<>\%101;
+‘<\%102;
+\\<>\%103;
+\^<>\%104;
+\|\|\|<\%105;
+≌<>\%106;
+\~<>\%107;
+±<>\%108;
+·<\%109;
+○<>\%110;
+̯<>\%127;
+̂<>\%128;
+†<\%129;
+̇<\%130;
+΅<>\%132;
+῍<>\%133;
+῏<>\%134;
+⏑́<>\%138;
+# %139 unencodable: idiosyn
+𐄒<\%140;
+⏖<>\%141;
+┐<>\%142;
+⏑̶<>\%144;
+–́<>\%145;
+·<\%146;
+̊<\%147;
+̌<>\%148;
+̨<>\%149;
+\|<\%150;
+# %151-%153 unencodable: non-TLG
+∴<>\%154;
+∵<>\%155;
+⸸<>\%157;
+⁂<>\%158;
+×<\%159;
+\-<>\%160;
+÷<>\%161;
+̸<>\%162;
+¶<>\%163;
+͙<>\%170;
+\/\/<\%171;
+ʼ<\%172;
+ʽ<\%173;
+´<\%174;
+\`<\%175;
+῀<\%176;
+̓<>\%177;
+̔<>\%178;
+̣<>\%179;
+̽<>\%180;
+̭<>\%181;
+͡<>\%182;
+͝<>\%183;
+͞<>\%184;
+⌙<>\%185;
+𝉂<\%186;
+¬<>\%187;
+̚<>\%188;
+
+\:<>\%10;
+•<>\%11;
+\*<\%12;
+‡<>\%13;
+§<>\%14;
+ˈ<>\%15;
+¦<>\%16;
+‖<>\%17;
+\'<\%18;
+–<\%19;
+́<>\%20;
+̀<>\%21;
+̂<\%22;
+̈<\%23;
+͂<>\%24;
+̧<>\%25;
+̄<>\%26;
+̆<>\%27;
+̈<\%28;
+̣̣<\%29;
+ʼ<>\%30;
+ʽ<>\%31;
+´<>\%32;
+\`<>\%33;
+῀<>\%34;
+῎<>\%35;
+῞<>\%36;
+῝<>\%37;
+῟<>\%38;
+¨<>\%39;
+⏑<>\%40;
+–<>\%41;
+⏕<>\%42;
+×<>\%43;
+⏒<>\%44;
+⏓<>\%45;
+⏔<>\%46;
+𐄑<>\%47;
+# %48-%49 unencodable: markup
+# %50-%65 unencodable: non-TLG
+β̸<\%69;
+# %70-%73 unencodable: non-TLG
+# %80-%81 unencodable: markup
+҅<>\%91;
+҆<>\%92;
+᷀<>\%93;
+̇<>\%94;
+᷁<>\%95;
+͜<>\%96;
+̈<>\%97;
+\"<>\%98;
+≈<>\%99;
+
+\?<>\%1;
+\*<>\%2;
+\/<\%3;
+\!<>\%4;
+\|<>\%5;
+\=<>\%6;
+\+<>\%7;
+\%<>\%8;
+\&<>\%9;
+
+†<>\%;
+
+:: NFC ();
 :: ([\*\#%0-9]);




More information about the sword-cvs mailing list