diff options
Diffstat (limited to 'src/chrtrans')
-rw-r--r-- | src/chrtrans/README.format | 4 | ||||
-rw-r--r-- | src/chrtrans/cp1250_uni.tbl | 10 | ||||
-rw-r--r-- | src/chrtrans/cp1253_uni.tbl | 34 | ||||
-rw-r--r-- | src/chrtrans/cp1255_uni.tbl | 46 | ||||
-rw-r--r-- | src/chrtrans/cp1256_uni.tbl | 16 | ||||
-rw-r--r-- | src/chrtrans/cp1257_uni.tbl | 24 |
6 files changed, 69 insertions, 65 deletions
diff --git a/src/chrtrans/README.format b/src/chrtrans/README.format index 5e8d029c..636afd32 100644 --- a/src/chrtrans/README.format +++ b/src/chrtrans/README.format @@ -82,6 +82,10 @@ c) character translation definitions: * where <range> ::= <fontpos>-<fontpos> * and <unicode> ::= U+<h><h><h><h> * and <h> ::= <hexadecimal digit> + * + [Note that <fontpos> _without_ targets assumed notdefined, + so tables from ftp.unicode.org need no patching.] + d) string replacement definitions: diff --git a/src/chrtrans/cp1250_uni.tbl b/src/chrtrans/cp1250_uni.tbl index a6852cfa..e7b19995 100644 --- a/src/chrtrans/cp1250_uni.tbl +++ b/src/chrtrans/cp1250_uni.tbl @@ -27,14 +27,14 @@ OWinLatin2 (cp1250) 0x20-0x7e idem # 0x80 U+20AC #EURO SIGN -#0x81 #UNDEFINED +0x81 #UNDEFINED 0x82 U+201A #SINGLE LOW-9 QUOTATION MARK -#0x83 #UNDEFINED +0x83 #UNDEFINED 0x84 U+201E #DOUBLE LOW-9 QUOTATION MARK 0x85 U+2026 #HORIZONTAL ELLIPSIS 0x86 U+2020 #DAGGER 0x87 U+2021 #DOUBLE DAGGER -#0x88 #UNDEFINED +0x88 #UNDEFINED 0x89 U+2030 #PER MILLE SIGN 0x8A U+0160 #LATIN CAPITAL LETTER S WITH CARON 0x8B U+2039 #SINGLE LEFT-POINTING ANGLE QUOTATION MARK @@ -42,7 +42,7 @@ OWinLatin2 (cp1250) 0x8D U+0164 #LATIN CAPITAL LETTER T WITH CARON 0x8E U+017D #LATIN CAPITAL LETTER Z WITH CARON 0x8F U+0179 #LATIN CAPITAL LETTER Z WITH ACUTE -#0x90 #UNDEFINED +0x90 #UNDEFINED 0x91 U+2018 #LEFT SINGLE QUOTATION MARK 0x92 U+2019 #RIGHT SINGLE QUOTATION MARK 0x93 U+201C #LEFT DOUBLE QUOTATION MARK @@ -50,7 +50,7 @@ OWinLatin2 (cp1250) 0x95 U+2022 #BULLET 0x96 U+2013 #EN DASH 0x97 U+2014 #EM DASH -#0x98 #UNDEFINED +0x98 #UNDEFINED 0x99 U+2122 #TRADE MARK SIGN 0x9A U+0161 #LATIN SMALL LETTER S WITH CARON 0x9B U+203A #SINGLE RIGHT-POINTING ANGLE QUOTATION MARK diff --git a/src/chrtrans/cp1253_uni.tbl b/src/chrtrans/cp1253_uni.tbl index dac37990..ed50b1ed 100644 --- a/src/chrtrans/cp1253_uni.tbl +++ b/src/chrtrans/cp1253_uni.tbl @@ -27,22 +27,22 @@ OWinGreek (cp1253) 0x20-0x7e idem # 0x80 U+20AC #EURO SIGN -#0x81 #UNDEFINED +0x81 #UNDEFINED 0x82 U+201A #SINGLE LOW-9 QUOTATION MARK 0x83 U+0192 #LATIN SMALL LETTER F WITH HOOK 0x84 U+201E #DOUBLE LOW-9 QUOTATION MARK 0x85 U+2026 #HORIZONTAL ELLIPSIS 0x86 U+2020 #DAGGER 0x87 U+2021 #DOUBLE DAGGER -#0x88 #UNDEFINED +0x88 #UNDEFINED 0x89 U+2030 #PER MILLE SIGN -#0x8A #UNDEFINED +0x8A #UNDEFINED 0x8B U+2039 #SINGLE LEFT-POINTING ANGLE QUOTATION MARK -#0x8C #UNDEFINED -#0x8D #UNDEFINED -#0x8E #UNDEFINED -#0x8F #UNDEFINED -#0x90 #UNDEFINED +0x8C #UNDEFINED +0x8D #UNDEFINED +0x8E #UNDEFINED +0x8F #UNDEFINED +0x90 #UNDEFINED 0x91 U+2018 #LEFT SINGLE QUOTATION MARK 0x92 U+2019 #RIGHT SINGLE QUOTATION MARK 0x93 U+201C #LEFT DOUBLE QUOTATION MARK @@ -50,14 +50,14 @@ OWinGreek (cp1253) 0x95 U+2022 #BULLET 0x96 U+2013 #EN DASH 0x97 U+2014 #EM DASH -#0x98 #UNDEFINED +0x98 #UNDEFINED 0x99 U+2122 #TRADE MARK SIGN -#0x9A #UNDEFINED +0x9A #UNDEFINED 0x9B U+203A #SINGLE RIGHT-POINTING ANGLE QUOTATION MARK -#0x9C #UNDEFINED -#0x9D #UNDEFINED -#0x9E #UNDEFINED -#0x9F #UNDEFINED +0x9C #UNDEFINED +0x9D #UNDEFINED +0x9E #UNDEFINED +0x9F #UNDEFINED 0xA0 U+00A0 #NO-BREAK SPACE 0xA1 U+0385 #GREEK DIALYTIKA TONOS 0xA2 U+0386 #GREEK CAPITAL LETTER ALPHA WITH TONOS @@ -68,7 +68,7 @@ OWinGreek (cp1253) 0xA7 U+00A7 #SECTION SIGN 0xA8 U+00A8 #DIAERESIS 0xA9 U+00A9 #COPYRIGHT SIGN -#0xAA #UNDEFINED +0xAA #UNDEFINED 0xAB U+00AB #LEFT-POINTING DOUBLE ANGLE QUOTATION MARK 0xAC U+00AC #NOT SIGN 0xAD U+00AD #SOFT HYPHEN @@ -108,7 +108,7 @@ OWinGreek (cp1253) 0xCF U+039F #GREEK CAPITAL LETTER OMICRON 0xD0 U+03A0 #GREEK CAPITAL LETTER PI 0xD1 U+03A1 #GREEK CAPITAL LETTER RHO -#0xD2 #UNDEFINED +0xD2 #UNDEFINED 0xD3 U+03A3 #GREEK CAPITAL LETTER SIGMA 0xD4 U+03A4 #GREEK CAPITAL LETTER TAU 0xD5 U+03A5 #GREEK CAPITAL LETTER UPSILON @@ -153,4 +153,4 @@ OWinGreek (cp1253) 0xFC U+03CC #GREEK SMALL LETTER OMICRON WITH TONOS 0xFD U+03CD #GREEK SMALL LETTER UPSILON WITH TONOS 0xFE U+03CE #GREEK SMALL LETTER OMEGA WITH TONOS -#0xFF #UNDEFINED +0xFF #UNDEFINED diff --git a/src/chrtrans/cp1255_uni.tbl b/src/chrtrans/cp1255_uni.tbl index a30d9a7d..67517353 100644 --- a/src/chrtrans/cp1255_uni.tbl +++ b/src/chrtrans/cp1255_uni.tbl @@ -27,7 +27,7 @@ OWinHebrew (cp1255) 0x20-0x7e idem # 0x80 U+20AC #EURO SIGN -#0x81 #UNDEFINED +0x81 #UNDEFINED 0x82 U+201A #SINGLE LOW-9 QUOTATION MARK 0x83 U+0192 #LATIN SMALL LETTER F WITH HOOK 0x84 U+201E #DOUBLE LOW-9 QUOTATION MARK @@ -36,13 +36,13 @@ OWinHebrew (cp1255) 0x87 U+2021 #DOUBLE DAGGER 0x88 U+02C6 #MODIFIER LETTER CIRCUMFLEX ACCENT 0x89 U+2030 #PER MILLE SIGN -#0x8A #UNDEFINED +0x8A #UNDEFINED 0x8B U+2039 #SINGLE LEFT-POINTING ANGLE QUOTATION MARK -#0x8C #UNDEFINED -#0x8D #UNDEFINED -#0x8E #UNDEFINED -#0x8F #UNDEFINED -#0x90 #UNDEFINED +0x8C #UNDEFINED +0x8D #UNDEFINED +0x8E #UNDEFINED +0x8F #UNDEFINED +0x90 #UNDEFINED 0x91 U+2018 #LEFT SINGLE QUOTATION MARK 0x92 U+2019 #RIGHT SINGLE QUOTATION MARK 0x93 U+201C #LEFT DOUBLE QUOTATION MARK @@ -52,12 +52,12 @@ OWinHebrew (cp1255) 0x97 U+2014 #EM DASH 0x98 U+02DC #SMALL TILDE 0x99 U+2122 #TRADE MARK SIGN -#0x9A #UNDEFINED +0x9A #UNDEFINED 0x9B U+203A #SINGLE RIGHT-POINTING ANGLE QUOTATION MARK -#0x9C #UNDEFINED -#0x9D #UNDEFINED -#0x9E #UNDEFINED -#0x9F #UNDEFINED +0x9C #UNDEFINED +0x9D #UNDEFINED +0x9E #UNDEFINED +0x9F #UNDEFINED 0xA0 U+00A0 #NO-BREAK SPACE 0xA1 U+00A1 #INVERTED EXCLAMATION MARK 0xA2 U+00A2 #CENT SIGN @@ -100,7 +100,7 @@ OWinHebrew (cp1255) 0xC7 U+05B7 #HEBREW POINT PATAH 0xC8 U+05B8 #HEBREW POINT QAMATS 0xC9 U+05B9 #HEBREW POINT HOLAM -#0xCA #UNDEFINED +0xCA #UNDEFINED 0xCB U+05BB #HEBREW POINT QUBUTS 0xCC U+05BC #HEBREW POINT DAGESH OR MAPIQ 0xCD U+05BD #HEBREW POINT METEG @@ -115,13 +115,13 @@ OWinHebrew (cp1255) 0xD6 U+05F2 #HEBREW LIGATURE YIDDISH DOUBLE YOD 0xD7 U+05F3 #HEBREW PUNCTUATION GERESH 0xD8 U+05F4 #HEBREW PUNCTUATION GERSHAYIM -#0xD9 #UNDEFINED -#0xDA #UNDEFINED -#0xDB #UNDEFINED -#0xDC #UNDEFINED -#0xDD #UNDEFINED -#0xDE #UNDEFINED -#0xDF #UNDEFINED +0xD9 #UNDEFINED +0xDA #UNDEFINED +0xDB #UNDEFINED +0xDC #UNDEFINED +0xDD #UNDEFINED +0xDE #UNDEFINED +0xDF #UNDEFINED 0xE0 U+05D0 #HEBREW LETTER ALEF 0xE1 U+05D1 #HEBREW LETTER BET 0xE2 U+05D2 #HEBREW LETTER GIMEL @@ -149,8 +149,8 @@ OWinHebrew (cp1255) 0xF8 U+05E8 #HEBREW LETTER RESH 0xF9 U+05E9 #HEBREW LETTER SHIN 0xFA U+05EA #HEBREW LETTER TAV -#0xFB #UNDEFINED -#0xFC #UNDEFINED +0xFB #UNDEFINED +0xFC #UNDEFINED 0xFD U+200E #LEFT-TO-RIGHT MARK 0xFE U+200F #RIGHT-TO-LEFT MARK -#0xFF #UNDEFINED +0xFF #UNDEFINED diff --git a/src/chrtrans/cp1256_uni.tbl b/src/chrtrans/cp1256_uni.tbl index 0e045aaa..844e450d 100644 --- a/src/chrtrans/cp1256_uni.tbl +++ b/src/chrtrans/cp1256_uni.tbl @@ -36,12 +36,12 @@ OWinArabic (cp1256) 0x87 U+2021 #DOUBLE DAGGER 0x88 U+02C6 #MODIFIER LETTER CIRCUMFLEX ACCENT 0x89 U+2030 #PER MILLE SIGN -#0x8A #UNDEFINED +0x8A #UNDEFINED 0x8B U+2039 #SINGLE LEFT-POINTING ANGLE QUOTATION MARK 0x8C U+0152 #LATIN CAPITAL LIGATURE OE 0x8D U+0686 #ARABIC LETTER TCHEH 0x8E U+0698 #ARABIC LETTER JEH -#0x8F #UNDEFINED +0x8F #UNDEFINED 0x90 U+06AF #ARABIC LETTER GAF 0x91 U+2018 #LEFT SINGLE QUOTATION MARK 0x92 U+2019 #RIGHT SINGLE QUOTATION MARK @@ -50,14 +50,14 @@ OWinArabic (cp1256) 0x95 U+2022 #BULLET 0x96 U+2013 #EN DASH 0x97 U+2014 #EM DASH -#0x98 #UNDEFINED +0x98 #UNDEFINED 0x99 U+2122 #TRADE MARK SIGN -#0x9A #UNDEFINED +0x9A #UNDEFINED 0x9B U+203A #SINGLE RIGHT-POINTING ANGLE QUOTATION MARK 0x9C U+0153 #LATIN SMALL LIGATURE OE 0x9D U+200C #ZERO WIDTH NON-JOINER 0x9E U+200D #ZERO WIDTH JOINER -#0x9F #UNDEFINED +0x9F #UNDEFINED 0xA0 U+00A0 #NO-BREAK SPACE 0xA1 U+060C #ARABIC COMMA 0xA2 U+00A2 #CENT SIGN @@ -68,7 +68,7 @@ OWinArabic (cp1256) 0xA7 U+00A7 #SECTION SIGN 0xA8 U+00A8 #DIAERESIS 0xA9 U+00A9 #COPYRIGHT SIGN -#0xAA #UNDEFINED +0xAA #UNDEFINED 0xAB U+00AB #LEFT-POINTING DOUBLE ANGLE QUOTATION MARK 0xAC U+00AC #NOT SIGN 0xAD U+00AD #SOFT HYPHEN @@ -90,7 +90,7 @@ OWinArabic (cp1256) 0xBD U+00BD #VULGAR FRACTION ONE HALF 0xBE U+00BE #VULGAR FRACTION THREE QUARTERS 0xBF U+061F #ARABIC QUESTION MARK -#0xC0 #UNDEFINED +0xC0 #UNDEFINED 0xC1 U+0621 #ARABIC LETTER HAMZA 0xC2 U+0622 #ARABIC LETTER ALEF WITH MADDA ABOVE 0xC3 U+0623 #ARABIC LETTER ALEF WITH HAMZA ABOVE @@ -153,4 +153,4 @@ OWinArabic (cp1256) 0xFC U+00FC #LATIN SMALL LETTER U WITH DIAERESIS 0xFD U+200E #LEFT-TO-RIGHT MARK 0xFE U+200F #RIGHT-TO-LEFT MARK -#0xFF #UNDEFINED +0xFF #UNDEFINED diff --git a/src/chrtrans/cp1257_uni.tbl b/src/chrtrans/cp1257_uni.tbl index 8e830cd5..5339fa7c 100644 --- a/src/chrtrans/cp1257_uni.tbl +++ b/src/chrtrans/cp1257_uni.tbl @@ -27,22 +27,22 @@ OWinBaltRim (cp1257) 0x20-0x7e idem # 0x80 U+20AC #EURO SIGN -#0x81 #UNDEFINED +0x81 #UNDEFINED 0x82 U+201A #SINGLE LOW-9 QUOTATION MARK -#0x83 #UNDEFINED +0x83 #UNDEFINED 0x84 U+201E #DOUBLE LOW-9 QUOTATION MARK 0x85 U+2026 #HORIZONTAL ELLIPSIS 0x86 U+2020 #DAGGER 0x87 U+2021 #DOUBLE DAGGER -#0x88 #UNDEFINED +0x88 #UNDEFINED 0x89 U+2030 #PER MILLE SIGN -#0x8A #UNDEFINED +0x8A #UNDEFINED 0x8B U+2039 #SINGLE LEFT-POINTING ANGLE QUOTATION MARK -#0x8C #UNDEFINED +0x8C #UNDEFINED 0x8D U+00A8 #DIAERESIS 0x8E U+02C7 #CARON 0x8F U+00B8 #CEDILLA -#0x90 #UNDEFINED +0x90 #UNDEFINED 0x91 U+2018 #LEFT SINGLE QUOTATION MARK 0x92 U+2019 #RIGHT SINGLE QUOTATION MARK 0x93 U+201C #LEFT DOUBLE QUOTATION MARK @@ -50,20 +50,20 @@ OWinBaltRim (cp1257) 0x95 U+2022 #BULLET 0x96 U+2013 #EN DASH 0x97 U+2014 #EM DASH -#0x98 #UNDEFINED +0x98 #UNDEFINED 0x99 U+2122 #TRADE MARK SIGN -#0x9A #UNDEFINED +0x9A #UNDEFINED 0x9B U+203A #SINGLE RIGHT-POINTING ANGLE QUOTATION MARK -#0x9C #UNDEFINED +0x9C #UNDEFINED 0x9D U+00AF #MACRON 0x9E U+02DB #OGONEK -#0x9F #UNDEFINED +0x9F #UNDEFINED 0xA0 U+00A0 #NO-BREAK SPACE -#0xA1 #UNDEFINED +0xA1 #UNDEFINED 0xA2 U+00A2 #CENT SIGN 0xA3 U+00A3 #POUND SIGN 0xA4 U+00A4 #CURRENCY SIGN -#0xA5 #UNDEFINED +0xA5 #UNDEFINED 0xA6 U+00A6 #BROKEN BAR 0xA7 U+00A7 #SECTION SIGN 0xA8 U+00D8 #LATIN CAPITAL LETTER O WITH STROKE |