1 <?xml version="1.0"?>
\r
3 <codeTable name="Basic and Extended Latin" date="January 2000" number="1">
\r
4 <note>The first column in this table contains the MARC-8 code (in hex) for
\r
5 the character as coming from the G0 graphic set, the second column
\r
6 contains the MARC-8 code (in hex) for the character as coming from the G1
\r
7 graphic set, the third column contains the UCS/Unicode 16-bit code (in
\r
8 hex), the fourth column contains the UTF-8 code (in hex) for the UCS
\r
9 characters, the fifth column contains a representation of the character (where possible),
\r
10 the sixth column contains the MARC character name, followed
\r
11 by the UCS name. If the MARC name is the same as or very similar to the
\r
12 UCS name, only the UCS name is given. For some tables alternate encodings
\r
13 in Unicode and UTF-8 are given. When that occurs the alternate Unicode and
\r
14 alternate UTF-8 columns follow the character name. </note>
\r
15 <characterSet name="Basic Latin (ASCII)" ISOcode="42">
\r
20 <name>ESCAPE (Unlikely to occur in UCS/Unicode)</name>
\r
26 <name>RECORD TERMINATOR / GROUP SEPARATOR</name>
\r
32 <name>FIELD TERMINATOR / RECORD SEPARATOR</name>
\r
38 <name>SUBFIELD DELIMITER / UNIT SEPARATOR</name>
\r
44 <name>SPACE, BLANK / SPACE</name>
\r
50 <name>EXCLAMATION MARK</name>
\r
56 <name>QUOTATION MARK</name>
\r
62 <name>NUMBER SIGN</name>
\r
68 <name>DOLLAR SIGN</name>
\r
74 <name>PERCENT SIGN</name>
\r
80 <name>AMPERSAND</name>
\r
86 <name>APOSTROPHE</name>
\r
92 <name>OPENING PARENTHESIS / LEFT PARENTHESIS</name>
\r
98 <name>CLOSING PARENTHESIS / RIGHT PARENTHESIS</name>
\r
104 <name>ASTERISK</name>
\r
110 <name>PLUS SIGN</name>
\r
122 <name>HYPHEN-MINUS</name>
\r
128 <name>PERIOD, DECIMAL POINT / FULL STOP</name>
\r
134 <name>SLASH / SOLIDUS</name>
\r
140 <name>DIGIT ZERO</name>
\r
146 <name>DIGIT ONE</name>
\r
152 <name>DIGIT TWO</name>
\r
158 <name>DIGIT THREE</name>
\r
164 <name>DIGIT FOUR</name>
\r
170 <name>DIGIT FIVE</name>
\r
176 <name>DIGIT SIX</name>
\r
182 <name>DIGIT SEVEN</name>
\r
188 <name>DIGIT EIGHT</name>
\r
194 <name>DIGIT NINE</name>
\r
206 <name>SEMICOLON</name>
\r
212 <name>LESS-THAN SIGN</name>
\r
218 <name>EQUALS SIGN</name>
\r
224 <name>GREATER-THAN SIGN</name>
\r
230 <name>QUESTION MARK</name>
\r
236 <name>COMMERCIAL AT</name>
\r
242 <name>LATIN CAPITAL LETTER A</name>
\r
248 <name>LATIN CAPITAL LETTER B</name>
\r
254 <name>LATIN CAPITAL LETTER C</name>
\r
260 <name>LATIN CAPITAL LETTER D</name>
\r
266 <name>LATIN CAPITAL LETTER E</name>
\r
272 <name>LATIN CAPITAL LETTER F</name>
\r
278 <name>LATIN CAPITAL LETTER G</name>
\r
284 <name>LATIN CAPITAL LETTER H</name>
\r
290 <name>LATIN CAPITAL LETTER I</name>
\r
296 <name>LATIN CAPITAL LETTER J</name>
\r
302 <name>LATIN CAPITAL LETTER K</name>
\r
308 <name>LATIN CAPITAL LETTER L</name>
\r
314 <name>LATIN CAPITAL LETTER M</name>
\r
320 <name>LATIN CAPITAL LETTER N</name>
\r
326 <name>LATIN CAPITAL LETTER O</name>
\r
332 <name>LATIN CAPITAL LETTER P</name>
\r
338 <name>LATIN CAPITAL LETTER Q</name>
\r
344 <name>LATIN CAPITAL LETTER R</name>
\r
350 <name>LATIN CAPITAL LETTER S</name>
\r
356 <name>LATIN CAPITAL LETTER T</name>
\r
362 <name>LATIN CAPITAL LETTER U</name>
\r
368 <name>LATIN CAPITAL LETTER V</name>
\r
374 <name>LATIN CAPITAL LETTER W</name>
\r
380 <name>LATIN CAPITAL LETTER X</name>
\r
386 <name>LATIN CAPITAL LETTER Y</name>
\r
392 <name>LATIN CAPITAL LETTER Z</name>
\r
398 <name>OPENING SQUARE BRACKET / LEFT SQUARE
\r
405 <name>REVERSE SLASH / REVERSE SOLIDUS</name>
\r
411 <name>CLOSING SQUARE BRACKET / RIGHT SQUARE
\r
418 <name>SPACING CIRCUMFLEX / CIRCUMFLEX ACCENT</name>
\r
424 <name>SPACING UNDERSCORE / LOW LINE</name>
\r
430 <name>SPACING GRAVE / GRAVE ACCENT</name>
\r
436 <name>LATIN SMALL LETTER A</name>
\r
442 <name>LATIN SMALL LETTER B</name>
\r
448 <name>LATIN SMALL LETTER C</name>
\r
454 <name>LATIN SMALL LETTER D</name>
\r
460 <name>LATIN SMALL LETTER E</name>
\r
466 <name>LATIN SMALL LETTER F</name>
\r
472 <name>LATIN SMALL LETTER G</name>
\r
478 <name>LATIN SMALL LETTER H</name>
\r
484 <name>LATIN SMALL LETTER I</name>
\r
490 <name>LATIN SMALL LETTER J</name>
\r
496 <name>LATIN SMALL LETTER K</name>
\r
502 <name>LATIN SMALL LETTER L</name>
\r
508 <name>LATIN SMALL LETTER M</name>
\r
514 <name>LATIN SMALL LETTER N</name>
\r
520 <name>LATIN SMALL LETTER O</name>
\r
526 <name>LATIN SMALL LETTER P</name>
\r
532 <name>LATIN SMALL LETTER Q</name>
\r
538 <name>LATIN SMALL LETTER R</name>
\r
544 <name>LATIN SMALL LETTER S</name>
\r
550 <name>LATIN SMALL LETTER T</name>
\r
556 <name>LATIN SMALL LETTER U</name>
\r
562 <name>LATIN SMALL LETTER V</name>
\r
568 <name>LATIN SMALL LETTER W</name>
\r
574 <name>LATIN SMALL LETTER X</name>
\r
580 <name>LATIN SMALL LETTER Y</name>
\r
586 <name>LATIN SMALL LETTER Z</name>
\r
592 <name>OPENING CURLY BRACKET / LEFT CURLY
\r
599 <name>VERTICAL BAR (FILL) / VERTICAL LINE</name>
\r
605 <name>CLOSING CURLY BRACKET / RIGHT CURLY
\r
612 <name>SPACING TILDE / TILDE</name>
\r
615 <characterSet name="Extended Latin (ANSEL)" date="January 2000, Updated September 2004" ISOcode="45">
\r
616 <note>Revised June 2004 to add the Eszett (M+C7) and the
\r
617 Euro Sign (M+C8) to the MARC-8 set.</note>
\r
619 <note>Revised September 2004 to change the mapping from
\r
620 MARC-8 to Unicode for the Ligature (M+EB and M+EC) from U+FE20 and U+FE21
\r
622 <note>Revised September 2004 to change the mapping from
\r
623 MARC-8 to Unicode for the Double Tilde (M+FA and M+FB) from U+FE22 and U+FE23
\r
625 <note>Revised March 2005 to change the mapping from MARC-8 to Unicode
\r
626 for the Alif (M+2E) from U+02BE to U+02BC.</note>
\r
630 <utf-8>C298</utf-8>
\r
631 <name>NON-SORT BEGIN / START OF STRING</name>
\r
636 <utf-8>C29C</utf-8>
\r
637 <name>NON-SORT END / STRING TERMINATOR</name>
\r
642 <utf-8>E2808D</utf-8>
\r
643 <name>JOINER / ZERO WIDTH JOINER</name>
\r
648 <utf-8>E2808C</utf-8>
\r
649 <name>NON-JOINER / ZERO WIDTH NON-JOINER</name>
\r
654 <utf-8>C581</utf-8>
\r
655 <name>UPPERCASE POLISH L / LATIN CAPITAL LETTER L WITH
\r
661 <utf-8>C398</utf-8>
\r
662 <name>UPPERCASE SCANDINAVIAN O / LATIN CAPITAL LETTER
\r
663 O WITH STROKE</name>
\r
668 <utf-8>C490</utf-8>
\r
669 <name>UPPERCASE D WITH CROSSBAR / LATIN CAPITAL LETTER
\r
670 D WITH STROKE</name>
\r
675 <utf-8>C39E</utf-8>
\r
676 <name>UPPERCASE ICELANDIC THORN / LATIN CAPITAL LETTER
\r
677 THORN (Icelandic)</name>
\r
682 <utf-8>C386</utf-8>
\r
683 <name>UPPERCASE DIGRAPH AE / LATIN CAPITAL LIGATURE
\r
689 <utf-8>C592</utf-8>
\r
690 <name>UPPERCASE DIGRAPH OE / LATIN CAPITAL LIGATURE
\r
696 <utf-8>CAB9</utf-8>
\r
697 <name>SOFT SIGN, PRIME / MODIFIER LETTER PRIME</name>
\r
702 <utf-8>C2B7</utf-8>
\r
703 <name>MIDDLE DOT</name>
\r
708 <utf-8>E299AD</utf-8>
\r
709 <name>MUSIC FLAT SIGN</name>
\r
714 <utf-8>C2AE</utf-8>
\r
715 <name>PATENT MARK / REGISTERED SIGN</name>
\r
720 <utf-8>C2B1</utf-8>
\r
721 <name>PLUS OR MINUS / PLUS-MINUS SIGN</name>
\r
726 <utf-8>C6A0</utf-8>
\r
727 <name>UPPERCASE O-HOOK / LATIN CAPITAL LETTER O WITH
\r
733 <utf-8>C6AF</utf-8>
\r
734 <name>UPPERCASE U-HOOK / LATIN CAPITAL LETTER U WITH
\r
740 <utf-8>CABC</utf-8>
\r
741 <name>ALIF / MODIFIER LETTER APOSTROPHE</name>
\r
746 <utf-8>CABB</utf-8>
\r
747 <name>AYN / MODIFIER LETTER TURNED COMMA</name>
\r
752 <utf-8>C582</utf-8>
\r
753 <name>LOWERCASE POLISH L / LATIN SMALL LETTER L WITH
\r
759 <utf-8>C3B8</utf-8>
\r
760 <name>LOWERCASE SCANDINAVIAN O / LATIN SMALL LETTER O
\r
766 <utf-8>C491</utf-8>
\r
767 <name>LOWERCASE D WITH CROSSBAR / LATIN SMALL LETTER
\r
768 D WITH STROKE</name>
\r
773 <utf-8>C3BE</utf-8>
\r
774 <name>LOWERCASE ICELANDIC THORN / LATIN SMALL LETTER
\r
775 THORN (Icelandic)</name>
\r
780 <utf-8>C3A6</utf-8>
\r
781 <name>LOWERCASE DIGRAPH AE / LATIN SMALL LIGATURE
\r
787 <utf-8>C593</utf-8>
\r
788 <name>LOWERCASE DIGRAPH OE / LATIN SMALL LIGATURE
\r
794 <utf-8>CABA</utf-8>
\r
795 <name>HARD SIGN, DOUBLE PRIME / MODIFIER LETTER DOUBLE
\r
801 <utf-8>C4B1</utf-8>
\r
802 <name>LOWERCASE TURKISH I / LATIN SMALL LETTER DOTLESS
\r
808 <utf-8>C2A3</utf-8>
\r
809 <name>BRITISH POUND / POUND SIGN</name>
\r
814 <utf-8>C3B0</utf-8>
\r
815 <name>LOWERCASE ETH / LATIN SMALL LETTER ETH
\r
821 <utf-8>C6A1</utf-8>
\r
822 <name>LOWERCASE O-HOOK / LATIN SMALL LETTER O WITH
\r
828 <utf-8>C6B0</utf-8>
\r
829 <name>LOWERCASE U-HOOK / LATIN SMALL LETTER U WITH
\r
835 <utf-8>C2B0</utf-8>
\r
836 <name>DEGREE SIGN</name>
\r
841 <utf-8>E28493</utf-8>
\r
842 <name>SCRIPT SMALL L</name>
\r
847 <utf-8>E28497</utf-8>
\r
848 <name>SOUND RECORDING COPYRIGHT</name>
\r
853 <utf-8>C2A9</utf-8>
\r
854 <name>COPYRIGHT SIGN</name>
\r
859 <utf-8>E299AF</utf-8>
\r
860 <name>MUSIC SHARP SIGN</name>
\r
865 <utf-8>C2BF</utf-8>
\r
866 <name>INVERTED QUESTION MARK</name>
\r
871 <utf-8>C2A1</utf-8>
\r
872 <name>INVERTED EXCLAMATION MARK</name>
\r
877 <utf-8>C39F</utf-8>
\r
878 <name>ESZETT SYMBOL</name>
\r
883 <utf-8>E282AC</utf-8>
\r
884 <name>EURO SIGN</name>
\r
887 <isCombining>true</isCombining>
\r
890 <utf-8>CC89</utf-8>
\r
891 <name>PSEUDO QUESTION MARK / COMBINING HOOK
\r
895 <isCombining>true</isCombining>
\r
898 <utf-8>CC80</utf-8>
\r
899 <name>GRAVE / COMBINING GRAVE ACCENT (Varia)</name>
\r
902 <isCombining>true</isCombining>
\r
905 <utf-8>CC81</utf-8>
\r
906 <name>ACUTE / COMBINING ACUTE ACCENT (Oxia)</name>
\r
909 <isCombining>true</isCombining>
\r
912 <utf-8>CC82</utf-8>
\r
913 <name>CIRCUMFLEX / COMBINING CIRCUMFLEX
\r
917 <isCombining>true</isCombining>
\r
920 <utf-8>CC83</utf-8>
\r
921 <name>TILDE / COMBINING TILDE</name>
\r
924 <isCombining>true</isCombining>
\r
927 <utf-8>CC84</utf-8>
\r
928 <name>MACRON / COMBINING MACRON</name>
\r
931 <isCombining>true</isCombining>
\r
934 <utf-8>CC86</utf-8>
\r
935 <name>BREVE / COMBINING BREVE (Vrachy)</name>
\r
938 <isCombining>true</isCombining>
\r
941 <utf-8>CC87</utf-8>
\r
942 <name>SUPERIOR DOT / COMBINING DOT ABOVE</name>
\r
945 <isCombining>true</isCombining>
\r
948 <utf-8>CC88</utf-8>
\r
949 <name>UMLAUT, DIAERESIS / COMBINING DIAERESIS
\r
953 <isCombining>true</isCombining>
\r
956 <utf-8>CC8C</utf-8>
\r
957 <name>HACEK / COMBINING CARON</name>
\r
960 <isCombining>true</isCombining>
\r
963 <utf-8>CC8A</utf-8>
\r
964 <name>CIRCLE ABOVE, ANGSTROM / COMBINING RING
\r
968 <isCombining>true</isCombining>
\r
971 <utf-8>CDA1</utf-8>
\r
973 <altutf-8>EFB8A0</altutf-8>
\r
974 <name>LIGATURE, FIRST HALF / COMBINING DOUBLE
\r
975 INVERTED BREVE</name>
\r
978 <isCombining>true</isCombining>
\r
983 <altutf-8>EFB8A1</altutf-8>
\r
984 <name>LIGATURE, SECOND HALF / COMBINING LIGATURE RIGHT HALF</name>
\r
985 <note>The Ligature that spans two characters
\r
986 is constructed of two halves in MARC-8: EB
\r
987 (Ligature, first half) and EC (Ligature, second
\r
988 half). The preferred Unicode/UTF-8 mapping is to
\r
989 the single character Ligature that spans two characters,
\r
990 U+0361. The single character Ligature is encoded
\r
991 following the second of the two characters to be spanned.
\r
992 The two half Ligatures in Unicode, to which the
\r
993 Ligature has been mapped since 1996, are indicated
\r
994 in the mapping as alternatives, but their use is not
\r
995 recommended. It is expected that font support for
\r
996 the single character Ligature mark will be more
\r
997 easily obtained than for the two halves.</note>
\r
1000 <isCombining>true</isCombining>
\r
1003 <utf-8>CC95</utf-8>
\r
1004 <name>HIGH COMMA, OFF CENTER / COMBINING COMMA ABOVE
\r
1008 <isCombining>true</isCombining>
\r
1011 <utf-8>CC8B</utf-8>
\r
1012 <name>DOUBLE ACUTE / COMBINING DOUBLE ACUTE
\r
1016 <isCombining>true</isCombining>
\r
1019 <utf-8>CC90</utf-8>
\r
1020 <name>CANDRABINDU / COMBINING CANDRABINDU</name>
\r
1023 <isCombining>true</isCombining>
\r
1026 <utf-8>CCA7</utf-8>
\r
1027 <name>CEDILLA / COMBINING CEDILLA</name>
\r
1030 <isCombining>true</isCombining>
\r
1033 <utf-8>CCA8</utf-8>
\r
1034 <name>RIGHT HOOK, OGONEK / COMBINING OGONEK</name>
\r
1037 <isCombining>true</isCombining>
\r
1040 <utf-8>CCA3</utf-8>
\r
1041 <name>DOT BELOW / COMBINING DOT BELOW</name>
\r
1044 <isCombining>true</isCombining>
\r
1047 <utf-8>CCA4</utf-8>
\r
1048 <name>DOUBLE DOT BELOW / COMBINING DIAERESIS
\r
1052 <isCombining>true</isCombining>
\r
1055 <utf-8>CCA5</utf-8>
\r
1056 <name>CIRCLE BELOW / COMBINING RING BELOW</name>
\r
1059 <isCombining>true</isCombining>
\r
1062 <utf-8>CCB3</utf-8>
\r
1063 <name>DOUBLE UNDERSCORE / COMBINING DOUBLE LOW
\r
1067 <isCombining>true</isCombining>
\r
1070 <utf-8>CCB2</utf-8>
\r
1071 <name>UNDERSCORE / COMBINING LOW LINE</name>
\r
1074 <isCombining>true</isCombining>
\r
1077 <utf-8>CCA6</utf-8>
\r
1078 <name>LEFT HOOK (COMMA BELOW) / COMBINING COMMA
\r
1082 <isCombining>true</isCombining>
\r
1085 <utf-8>CC9C</utf-8>
\r
1086 <name>RIGHT CEDILLA / COMBINING LEFT HALF RING
\r
1090 <isCombining>true</isCombining>
\r
1093 <utf-8>CCAE</utf-8>
\r
1094 <name>UPADHMANIYA / COMBINING BREVE BELOW</name>
\r
1097 <isCombining>true</isCombining>
\r
1100 <utf-8>CDA0</utf-8>
\r
1102 <altutf-8>EFB8A2</altutf-8>
\r
1103 <name>DOUBLE TILDE, FIRST HALF / COMBINING DOUBLE TILDE</name>
\r
1106 <isCombining>true</isCombining>
\r
1111 <altutf-8>EFB8A3</altutf-8>
\r
1112 <name>DOUBLE TILDE, SECOND HALF / COMBINING DOUBLE TILDE RIGHT HALF</name>
\r
1113 <note>The Double Tilde that spans two characters is
\r
1114 constructed of two halves in MARC-8: FA (Double
\r
1115 Tilde, first half) and FB (Double Tilde, second
\r
1116 half). The preferred Unicode/UTF-8 mapping
\r
1117 is to the single character Double Tilde that
\r
1118 spans two characters, U+0360. The single
\r
1119 character Double Tilde is encoded following
\r
1120 the second of the two characters to be spanned.
\r
1121 The two half Double Tildes in Unicode, to
\r
1122 which the MARC-8 Double Tilde has been
\r
1123 mapped since 1996, are indicated in the
\r
1124 mapping as alternatives, but their use is not
\r
1125 recommended. It is expected that font support
\r
1126 for the single character Double Tilde mark will
\r
1127 be more easily obtained than for the two halves.</note>
\r
1130 <isCombining>true</isCombining>
\r
1133 <utf-8>CC93</utf-8>
\r
1134 <name>HIGH COMMA, CENTERED / COMBINING COMMA ABOVE
\r
1139 <codeTable name="Greek Symbols" date="January 2000, Updated September 2004" number="2">
\r
1140 <note>The first column in this table contains the MARC-8 code (in hex) for
\r
1141 the character, the second column contains the UCS/Unicode 16-bit code (in
\r
1142 hex), the third column contains the UTF-8 code (in hex) for the UCS
\r
1143 character, the fourth column contains a representation of the character (where possible),
\r
1144 the fifth column contains the MARC character name, followed by
\r
1145 the UCS name. If the MARC name is the same as or very similar to the UCS
\r
1146 name, only the UCS name is given.</note>
\r
1147 <note>Note added September 2004: The alpha, beta and gamma symbols that have been part of a
\r
1148 special extension of the MARC-8 character set since 1970 do not
\r
1149 have reversible mappings to Unicode since they duplicate
\r
1150 characters in the Greek script set. These special characters
\r
1151 map to the Greek set in Unicode, thus when being remapped to
\r
1152 MARC-8 they go to the MARC-8 Greek set, not the special
\r
1153 extension to the Latin set. It is recommended that the
\r
1154 spelling out of the characters be used when the Latin
\r
1155 extension Greek characters would formerly have been used,
\r
1156 i.e., when they occur in Latin text. The following
\r
1157 substitutions would be made: [alpha], [beta], and [gamma].</note>
\r
1158 <characterSet name="Greek Symbols" ISOcode="67">
\r
1162 <utf-8>CEB1</utf-8>
\r
1163 <name>GREEK SMALL LETTER ALPHA</name>
\r
1168 <utf-8>CEB2</utf-8>
\r
1169 <name>GREEK SMALL LETTER BETA</name>
\r
1174 <utf-8>CEB3</utf-8>
\r
1175 <name>GREEK SMALL LETTER GAMMA</name>
\r
1179 <codeTable name="Subscripts" date="January 2000" number="3">
\r
1180 <note>The first column in this table contains the MARC-8 code (in hex) for
\r
1181 the character, the second column contains the UCS/Unicode 16-bit code (in
\r
1182 hex), the third column contains the UTF-8 code (in hex) for the UCS
\r
1183 character, the fourth column contains a representation of the character (where possible),
\r
1184 the fifth column contains the MARC character name, followed by
\r
1185 the UCS name. If the MARC name is the same as or very similar to the UCS
\r
1186 name, only the UCS name is given.</note>
\r
1187 <characterSet name="Subscripts" ISOcode="62">
\r
1191 <utf-8>E2828D</utf-8>
\r
1192 <name>SUBSCRIPT OPENING PARENTHESIS / SUBSCRIPT LEFT
\r
1193 PARENTHESIS</name>
\r
1198 <utf-8>E2828E</utf-8>
\r
1199 <name>SUBSCRIPT CLOSING PARENTHESIS / SUBSCRIPT RIGHT
\r
1200 PARENTHESIS</name>
\r
1205 <utf-8>E2828A</utf-8>
\r
1206 <name>SUBSCRIPT PLUS SIGN</name>
\r
1211 <utf-8>E2828B</utf-8>
\r
1212 <name>SUBSCRIPT HYPHEN-MINUS / SUBSCRIPT MINUS</name>
\r
1217 <utf-8>E28280</utf-8>
\r
1218 <name>SUBSCRIPT DIGIT ZERO</name>
\r
1223 <utf-8>E28281</utf-8>
\r
1224 <name>SUBSCRIPT DIGIT ONE</name>
\r
1229 <utf-8>E28282</utf-8>
\r
1230 <name>SUBSCRIPT DIGIT TWO</name>
\r
1235 <utf-8>E28283</utf-8>
\r
1236 <name>SUBSCRIPT DIGIT THREE</name>
\r
1241 <utf-8>E28284</utf-8>
\r
1242 <name>SUBSCRIPT DIGIT FOUR</name>
\r
1247 <utf-8>E28285</utf-8>
\r
1248 <name>SUBSCRIPT DIGIT FIVE</name>
\r
1253 <utf-8>E28286</utf-8>
\r
1254 <name>SUBSCRIPT DIGIT SIX</name>
\r
1259 <utf-8>E28287</utf-8>
\r
1260 <name>SUBSCRIPT DIGIT SEVEN</name>
\r
1265 <utf-8>E28288</utf-8>
\r
1266 <name>SUBSCRIPT DIGIT EIGHT</name>
\r
1271 <utf-8>E28289</utf-8>
\r
1272 <name>SUBSCRIPT DIGIT NINE</name>
\r
1276 <codeTable name="Superscripts" date="January 2000" number="4">
\r
1277 <note>The first column in this table contains the MARC-8 code (in hex) for
\r
1278 the character, the second column contains the UCS/Unicode 16-bit code (in
\r
1279 hex), the third column contains the UTF-8 code (in hex) for the UCS
\r
1280 character, the fourth column contains a representation of the character (where possible),
\r
1281 the fifth column contains the MARC character name, followed by
\r
1282 the UCS name. If the MARC name is the same as or very similar to the UCS
\r
1283 name, only the UCS name is given.</note>
\r
1284 <characterSet name="Superscripts" ISOcode="70">
\r
1288 <utf-8>E281BD</utf-8>
\r
1289 <name>SUPERSCRIPT OPENING PARENTHESIS / SUPERSCRIPT LEFT
\r
1290 PARENTHESIS</name>
\r
1295 <utf-8>E281BE</utf-8>
\r
1296 <name>SUPERSCRIPT CLOSING PARENTHESIS / SUPERSCRIPT
\r
1297 RIGHT PARENTHESIS</name>
\r
1302 <utf-8>E281BA</utf-8>
\r
1303 <name>SUPERSCRIPT PLUS SIGN</name>
\r
1308 <utf-8>E281BB</utf-8>
\r
1309 <name>SUPERSCRIPT HYPHEN-MINUS / SUPERSCRIPT
\r
1315 <utf-8>E281B0</utf-8>
\r
1316 <name>SUPERSCRIPT DIGIT ZERO</name>
\r
1321 <utf-8>C2B9</utf-8>
\r
1322 <name>SUPERSCRIPT DIGIT ONE</name>
\r
1327 <utf-8>C2B2</utf-8>
\r
1328 <name>SUPERSCRIPT DIGIT TWO</name>
\r
1333 <utf-8>C2B3</utf-8>
\r
1334 <name>SUPERSCRIPT DIGIT THREE</name>
\r
1339 <utf-8>E281B4</utf-8>
\r
1340 <name>SUPERSCRIPT DIGIT FOUR</name>
\r
1345 <utf-8>E281B5</utf-8>
\r
1346 <name>SUPERSCRIPT DIGIT FIVE</name>
\r
1351 <utf-8>E281B6</utf-8>
\r
1352 <name>SUPERSCRIPT DIGIT SIX</name>
\r
1357 <utf-8>E281B7</utf-8>
\r
1358 <name>SUPERSCRIPT DIGIT SEVEN</name>
\r
1363 <utf-8>E281B8</utf-8>
\r
1364 <name>SUPERSCRIPT DIGIT EIGHT</name>
\r
1369 <utf-8>E281B9</utf-8>
\r
1370 <name>SUPERSCRIPT DIGIT NINE</name>
\r
1374 <codeTable name="Basic Hebrew" date="January 2000" number="5">
\r
1375 <note>The first column in this table contains the MARC-8 code (in hex) for
\r
1376 the character as coming from the G0 graphic set, the second column
\r
1377 contains the MARC-8 code (in hex) for the character as coming from the G1
\r
1378 graphic set, the third column contains the UCS/Unicode 16-bit code (in
\r
1379 hex), the fourth column contains the UTF-8 code (in hex) for the UCS
\r
1380 characters, the fifth column contains a representation of the character (where possible),
\r
1381 the sixth column contains the MARC character name, followed
\r
1382 by the UCS name. If the MARC name is the same as or very similar to the
\r
1383 UCS name, only the UCS name is given.</note>
\r
1384 <characterSet name="Basic Hebrew" ISOcode="32">
\r
1389 <name>EXCLAMATION MARK</name>
\r
1394 <utf-8>D7B4</utf-8>
\r
1395 <name>QUOTATION MARK, GERSHAYIM / HEBREW PUNCTUATION
\r
1402 <name>NUMBER SIGN</name>
\r
1408 <name>DOLLAR SIGN</name>
\r
1414 <name>PERCENT SIGN</name>
\r
1420 <name>AMPERSAND</name>
\r
1425 <utf-8>D7B3</utf-8>
\r
1426 <name>APOSTROPHE, GERESH / HEBREW PUNCTUATION
\r
1433 <name>OPENING PARENTHESIS / LEFT PARENTHESIS</name>
\r
1439 <name>CLOSING PARENTHESIS / RIGHT PARENTHESIS</name>
\r
1445 <name>ASTERISK</name>
\r
1451 <name>PLUS SIGN</name>
\r
1457 <name>COMMA</name>
\r
1462 <utf-8>D6BE</utf-8>
\r
1463 <name>HYPHEN-MINUS, MAKEF / HEBREW PUNCTUATION
\r
1470 <name>PERIOD, DECIMAL POINT / FULL STOP</name>
\r
1476 <name>SLASH / SOLIDUS</name>
\r
1482 <name>DIGIT ZERO</name>
\r
1488 <name>DIGIT ONE</name>
\r
1494 <name>DIGIT TWO</name>
\r
1500 <name>DIGIT THREE</name>
\r
1506 <name>DIGIT FOUR</name>
\r
1512 <name>DIGIT FIVE</name>
\r
1518 <name>DIGIT SIX</name>
\r
1524 <name>DIGIT SEVEN</name>
\r
1530 <name>DIGIT EIGHT</name>
\r
1536 <name>DIGIT NINE</name>
\r
1542 <name>COLON</name>
\r
1548 <name>SEMICOLON</name>
\r
1554 <name>LESS-THAN SIGN</name>
\r
1560 <name>EQUALS SIGN</name>
\r
1566 <name>GREATER-THAN SIGN</name>
\r
1572 <name>QUESTION MARK</name>
\r
1575 <isCombining>true</isCombining>
\r
1578 <utf-8>D6B7</utf-8>
\r
1579 <name>HEBREW POINT PATAH</name>
\r
1582 <isCombining>true</isCombining>
\r
1585 <utf-8>D6B8</utf-8>
\r
1586 <name>KAMATS / HEBREW POINT QAMATS</name>
\r
1589 <isCombining>true</isCombining>
\r
1592 <utf-8>D6B6</utf-8>
\r
1593 <name>HEBREW POINT SEGOL</name>
\r
1596 <isCombining>true</isCombining>
\r
1599 <utf-8>D6B5</utf-8>
\r
1600 <name>TSEREH / HEBREW POINT TSERE</name>
\r
1603 <isCombining>true</isCombining>
\r
1606 <utf-8>D6B4</utf-8>
\r
1607 <name>HIRIK / HEBREW POINT HIRIQ</name>
\r
1610 <isCombining>true</isCombining>
\r
1613 <utf-8>D6B9</utf-8>
\r
1614 <name>HOLAM, LEFT SIN DOT / HEBREW POINT HOLAM</name>
\r
1617 <isCombining>true</isCombining>
\r
1620 <utf-8>D6BB</utf-8>
\r
1621 <name>KUBUTS / HEBREW POINT QUBUTS</name>
\r
1624 <isCombining>true</isCombining>
\r
1627 <utf-8>D6B0</utf-8>
\r
1628 <name>HEBREW POINT SHEVA</name>
\r
1631 <isCombining>true</isCombining>
\r
1634 <utf-8>D6B2</utf-8>
\r
1635 <name>HEBREW POINT HATAF PATAH</name>
\r
1638 <isCombining>true</isCombining>
\r
1641 <utf-8>D6B3</utf-8>
\r
1642 <name>HATAF KAMATS / HEBREW POINT HATAF QAMATS</name>
\r
1645 <isCombining>true</isCombining>
\r
1648 <utf-8>D6B1</utf-8>
\r
1649 <name>HEBREW POINT HATAF SEGOL</name>
\r
1652 <isCombining>true</isCombining>
\r
1655 <utf-8>D6BC</utf-8>
\r
1656 <name>HEBREW POINT DAGESH OR MAPIQ</name>
\r
1659 <isCombining>true</isCombining>
\r
1662 <utf-8>D6BF</utf-8>
\r
1663 <name>RAFEH / HEBREW POINT RAFE</name>
\r
1666 <isCombining>true</isCombining>
\r
1669 <utf-8>D781</utf-8>
\r
1670 <name>RIGHT SHIN DOT / HEBREW POINT SHIN DOT</name>
\r
1673 <isCombining>true</isCombining>
\r
1676 <utf-8>EFAC9E</utf-8>
\r
1677 <name>VARIKA / HEBREW POINT JUDEO-SPANISH
\r
1684 <name>OPENING SQUARE BRACKET / LEFT SQUARE
\r
1691 <name>CLOSING SQUARE BRACKET / RIGHT SQUARE
\r
1697 <utf-8>D790</utf-8>
\r
1698 <name>HEBREW LETTER ALEF</name>
\r
1703 <utf-8>D791</utf-8>
\r
1704 <name>HEBREW LETTER BET</name>
\r
1709 <utf-8>D792</utf-8>
\r
1710 <name>HEBREW LETTER GIMEL</name>
\r
1715 <utf-8>D793</utf-8>
\r
1716 <name>HEBREW LETTER DALET</name>
\r
1721 <utf-8>D794</utf-8>
\r
1722 <name>HEBREW LETTER HE</name>
\r
1727 <utf-8>D795</utf-8>
\r
1728 <name>HEBREW LETTER VAV</name>
\r
1733 <utf-8>D796</utf-8>
\r
1734 <name>HEBREW LETTER ZAYIN</name>
\r
1739 <utf-8>D797</utf-8>
\r
1740 <name>HEBREW LETTER HET</name>
\r
1745 <utf-8>D798</utf-8>
\r
1746 <name>HEBREW LETTER TET</name>
\r
1751 <utf-8>D799</utf-8>
\r
1752 <name>HEBREW LETTER YOD</name>
\r
1757 <utf-8>D79A</utf-8>
\r
1758 <name>HEBREW LETTER FINAL KAF</name>
\r
1763 <utf-8>D79B</utf-8>
\r
1764 <name>HEBREW LETTER KAF</name>
\r
1769 <utf-8>D79C</utf-8>
\r
1770 <name>HEBREW LETTER LAMED</name>
\r
1775 <utf-8>D79D</utf-8>
\r
1776 <name>HEBREW LETTER FINAL MEM</name>
\r
1781 <utf-8>D79E</utf-8>
\r
1782 <name>HEBREW LETTER MEM</name>
\r
1787 <utf-8>D79F</utf-8>
\r
1788 <name>HEBREW LETTER FINAL NUN</name>
\r
1793 <utf-8>D7A0</utf-8>
\r
1794 <name>HEBREW LETTER NUN</name>
\r
1799 <utf-8>D7A1</utf-8>
\r
1800 <name>HEBREW LETTER SAMEKH</name>
\r
1805 <utf-8>D7A2</utf-8>
\r
1806 <name>HEBREW LETTER AYIN</name>
\r
1811 <utf-8>D7A3</utf-8>
\r
1812 <name>HEBREW LETTER FINAL PE</name>
\r
1817 <utf-8>D7A4</utf-8>
\r
1818 <name>HEBREW LETTER PE</name>
\r
1823 <utf-8>D7A5</utf-8>
\r
1824 <name>HEBREW LETTER FINAL TSADI</name>
\r
1829 <utf-8>D7A6</utf-8>
\r
1830 <name>HEBREW LETTER TSADI</name>
\r
1835 <utf-8>D7A7</utf-8>
\r
1836 <name>HEBREW LETTER QOF / KOF</name>
\r
1841 <utf-8>D7A8</utf-8>
\r
1842 <name>HEBREW LETTER RESH</name>
\r
1847 <utf-8>D7A9</utf-8>
\r
1848 <name>HEBREW LETTER SHIN</name>
\r
1853 <utf-8>D7AA</utf-8>
\r
1854 <name>HEBREW LETTER TAV</name>
\r
1859 <utf-8>D7B0</utf-8>
\r
1860 <name>HEBREW LIGATURE YIDDISH DOUBLE VAV / TSVEY
\r
1866 <utf-8>D7B1</utf-8>
\r
1867 <name>HEBREW LIGATURE YIDDISH VAV YOD / VOV
\r
1873 <utf-8>D7B2</utf-8>
\r
1874 <name>HEBREW LIGATURE YIDDISH DOUBLE YOD / TSVEY
\r
1879 <codeTable name="Basic and Extended Cyrillic" date="January 2000" number="6">
\r
1880 <note>The first column in this table contains the MARC-8 code (in hex) for
\r
1881 the character as coming from the G0 graphic set, the second column
\r
1882 contains the MARC-8 code (in hex) for the character as coming from the G1
\r
1883 graphic set, the third column contains the UCS/Unicode 16-bit code (in
\r
1884 hex), the fourth column contains the UTF-8 code (in hex) for the UCS
\r
1885 characters, the fifth column contains a representation of the character (where possible),
\r
1886 the sixth column contains the MARC character name, followed
\r
1887 by the UCS name. If the MARC name is the same as or very similar to the
\r
1888 UCS name, only the UCS name is given.</note>
\r
1889 <characterSet name="Basic Cyrillic" ISOcode="4E">
\r
1894 <name>EXCLAMATION MARK</name>
\r
1900 <name>QUOTATION MARK</name>
\r
1906 <name>NUMBER SIGN</name>
\r
1912 <name>DOLLAR SIGN</name>
\r
1918 <name>PERCENT SIGN</name>
\r
1924 <name>AMPERSAND</name>
\r
1930 <name>APOSTROPHE</name>
\r
1936 <name>OPENING PARENTHESIS / LEFT PARENTHESIS</name>
\r
1942 <name>CLOSING PARENTHESIS / RIGHT PARENTHESIS</name>
\r
1948 <name>ASTERISK</name>
\r
1954 <name>PLUS SIGN</name>
\r
1960 <name>COMMA</name>
\r
1966 <name>HYPHEN-MINUS</name>
\r
1972 <name>PERIOD, DECIMAL POINT / FULL STOP</name>
\r
1978 <name>SLASH / SOLIDUS</name>
\r
1984 <name>DIGIT ZERO</name>
\r
1990 <name>DIGIT ONE</name>
\r
1996 <name>DIGIT TWO</name>
\r
2002 <name>DIGIT THREE</name>
\r
2008 <name>DIGIT FOUR</name>
\r
2014 <name>DIGIT FIVE</name>
\r
2020 <name>DIGIT SIX</name>
\r
2026 <name>DIGIT SEVEN</name>
\r
2032 <name>DIGIT EIGHT</name>
\r
2038 <name>DIGIT NINE</name>
\r
2044 <name>COLON</name>
\r
2050 <name>SEMICOLON</name>
\r
2056 <name>LESS-THAN SIGN</name>
\r
2062 <name>EQUALS SIGN</name>
\r
2068 <name>GREATER-THAN SIGN</name>
\r
2074 <name>QUESTION MARK</name>
\r
2079 <utf-8>D18E</utf-8>
\r
2080 <name>LOWERCASE IU / CYRILLIC SMALL LETTER YU</name>
\r
2085 <utf-8>D0B0</utf-8>
\r
2086 <name>CYRILLIC SMALL LETTER A</name>
\r
2091 <utf-8>D0B1</utf-8>
\r
2092 <name>CYRILLIC SMALL LETTER BE</name>
\r
2097 <utf-8>D186</utf-8>
\r
2098 <name>CYRILLIC SMALL LETTER TSE</name>
\r
2103 <utf-8>D0B4</utf-8>
\r
2104 <name>CYRILLIC SMALL LETTER DE</name>
\r
2109 <utf-8>D0B5</utf-8>
\r
2110 <name>CYRILLIC SMALL LETTER IE</name>
\r
2115 <utf-8>D184</utf-8>
\r
2116 <name>CYRILLIC SMALL LETTER EF</name>
\r
2121 <utf-8>D0B3</utf-8>
\r
2122 <name>LOWERCASE GE / CYRILLIC SMALL LETTER GHE</name>
\r
2127 <utf-8>D185</utf-8>
\r
2128 <name>LOWERCASE KHA / CYRILLIC SMALL LETTER HA</name>
\r
2133 <utf-8>D0B8</utf-8>
\r
2134 <name>LOWERCASE II / CYRILLIC SMALL LETTER I</name>
\r
2139 <utf-8>D0B9</utf-8>
\r
2140 <name>LOWERCASE SHORT II / CYRILLIC SMALL LETTER SHORT
\r
2146 <utf-8>D0BA</utf-8>
\r
2147 <name>CYRILLIC SMALL LETTER KA</name>
\r
2152 <utf-8>D0BB</utf-8>
\r
2153 <name>CYRILLIC SMALL LETTER EL</name>
\r
2158 <utf-8>D0BC</utf-8>
\r
2159 <name>CYRILLIC SMALL LETTER EM</name>
\r
2164 <utf-8>D0BD</utf-8>
\r
2165 <name>CYRILLIC SMALL LETTER EN</name>
\r
2170 <utf-8>D0BE</utf-8>
\r
2171 <name>CYRILLIC SMALL LETTER O</name>
\r
2176 <utf-8>D0BF</utf-8>
\r
2177 <name>CYRILLIC SMALL LETTER PE</name>
\r
2182 <utf-8>D18F</utf-8>
\r
2183 <name>LOWERCASE IA / CYRILLIC SMALL LETTER YA</name>
\r
2188 <utf-8>D180</utf-8>
\r
2189 <name>CYRILLIC SMALL LETTER ER</name>
\r
2194 <utf-8>D181</utf-8>
\r
2195 <name>CYRILLIC SMALL LETTER ES</name>
\r
2200 <utf-8>D182</utf-8>
\r
2201 <name>CYRILLIC SMALL LETTER TE</name>
\r
2206 <utf-8>D183</utf-8>
\r
2207 <name>CYRILLIC SMALL LETTER U</name>
\r
2212 <utf-8>D0B6</utf-8>
\r
2213 <name>CYRILLIC SMALL LETTER ZHE</name>
\r
2218 <utf-8>D0B2</utf-8>
\r
2219 <name>CYRILLIC SMALL LETTER VE</name>
\r
2224 <utf-8>D18C</utf-8>
\r
2225 <name>CYRILLIC SMALL LETTER SOFT SIGN</name>
\r
2230 <utf-8>D18B</utf-8>
\r
2231 <name>LOWERCASE YERI / CYRILLIC SMALL LETTER
\r
2237 <utf-8>D0B7</utf-8>
\r
2238 <name>CYRILLIC SMALL LETTER ZE</name>
\r
2243 <utf-8>D188</utf-8>
\r
2244 <name>CYRILLIC SMALL LETTER SHA</name>
\r
2249 <utf-8>D18D</utf-8>
\r
2250 <name>LOWERCASE REVERSED E / CYRILLIC SMALL LETTER
\r
2256 <utf-8>D189</utf-8>
\r
2257 <name>CYRILLIC SMALL LETTER SHCHA</name>
\r
2262 <utf-8>D187</utf-8>
\r
2263 <name>CYRILLIC SMALL LETTER CHE</name>
\r
2268 <utf-8>D18A</utf-8>
\r
2269 <name>CYRILLIC SMALL LETTER HARD SIGN</name>
\r
2274 <utf-8>D0AE</utf-8>
\r
2275 <name>UPPERCASE IU / CYRILLIC CAPITAL LETTER YU</name>
\r
2280 <utf-8>D090</utf-8>
\r
2281 <name>CYRILLIC CAPITAL LETTER A</name>
\r
2286 <utf-8>D091</utf-8>
\r
2287 <name>CYRILLIC CAPITAL LETTER BE</name>
\r
2292 <utf-8>D0A6</utf-8>
\r
2293 <name>CYRILLIC CAPITAL LETTER TSE</name>
\r
2298 <utf-8>D094</utf-8>
\r
2299 <name>CYRILLIC CAPITAL LETTER DE</name>
\r
2304 <utf-8>D095</utf-8>
\r
2305 <name>CYRILLIC CAPITAL LETTER IE</name>
\r
2310 <utf-8>D0A4</utf-8>
\r
2311 <name>CYRILLIC CAPITAL LETTER EF</name>
\r
2316 <utf-8>D093</utf-8>
\r
2317 <name>UPPERCASE GE / CYRILLIC CAPITAL LETTER GHE</name>
\r
2322 <utf-8>D0A5</utf-8>
\r
2323 <name>UPPERCASE KHA / CYRILLIC CAPITAL LETTER HA</name>
\r
2328 <utf-8>D098</utf-8>
\r
2329 <name>UPPERCASE II / CYRILLIC CAPITAL LETTER I</name>
\r
2334 <utf-8>D099</utf-8>
\r
2335 <name>UPPERCASE SHORT II / CYRILLIC CAPITAL LETTER SHORT
\r
2341 <utf-8>D09A</utf-8>
\r
2342 <name>CYRILLIC CAPITAL LETTER KA</name>
\r
2347 <utf-8>D09B</utf-8>
\r
2348 <name>CYRILLIC CAPITAL LETTER EL</name>
\r
2353 <utf-8>D09C</utf-8>
\r
2354 <name>CYRILLIC CAPITAL LETTER EM</name>
\r
2359 <utf-8>D09D</utf-8>
\r
2360 <name>CYRILLIC CAPITAL LETTER EN</name>
\r
2365 <utf-8>D09E</utf-8>
\r
2366 <name>CYRILLIC CAPITAL LETTER O</name>
\r
2371 <utf-8>D09F</utf-8>
\r
2372 <name>CYRILLIC CAPITAL LETTER PE</name>
\r
2377 <utf-8>D0AF</utf-8>
\r
2378 <name>UPPERCASE IA / CYRILLIC CAPITAL LETTER YA</name>
\r
2383 <utf-8>D0A0</utf-8>
\r
2384 <name>CYRILLIC CAPITAL LETTER ER</name>
\r
2389 <utf-8>D0A1</utf-8>
\r
2390 <name>CYRILLIC CAPITAL LETTER ES</name>
\r
2395 <utf-8>D0A2</utf-8>
\r
2396 <name>CYRILLIC CAPITAL LETTER TE</name>
\r
2401 <utf-8>D0A3</utf-8>
\r
2402 <name>CYRILLIC CAPITAL LETTER U</name>
\r
2407 <utf-8>D096</utf-8>
\r
2408 <name>CYRILLIC CAPITAL LETTER ZHE</name>
\r
2413 <utf-8>D092</utf-8>
\r
2414 <name>CYRILLIC CAPITAL LETTER VE</name>
\r
2419 <utf-8>D0AC</utf-8>
\r
2420 <name>CYRILLIC CAPITAL LETTER SOFT SIGN</name>
\r
2425 <utf-8>D0AB</utf-8>
\r
2426 <name>UPPERCASE YERI / CYRILLIC CAPITAL LETTER
\r
2432 <utf-8>D097</utf-8>
\r
2433 <name>CYRILLIC CAPITAL LETTER ZE</name>
\r
2438 <utf-8>D0A8</utf-8>
\r
2439 <name>CYRILLIC CAPITAL LETTER SHA</name>
\r
2444 <utf-8>D0AD</utf-8>
\r
2445 <name>CYRILLIC CAPITAL LETTER E</name>
\r
2450 <utf-8>D0A9</utf-8>
\r
2451 <name>CYRILLIC CAPITAL LETTER SHCHA</name>
\r
2456 <utf-8>D0A7</utf-8>
\r
2457 <name>CYRILLIC CAPITAL LETTER CHE</name>
\r
2460 <characterSet name="Extended Cyrillic" ISOcode="51">
\r
2464 <utf-8>D291</utf-8>
\r
2465 <name>LOWERCASE GE WITH UPTURN / CYRILLIC SMALL LETTER
\r
2466 GHE WITH UPTURN</name>
\r
2471 <utf-8>D192</utf-8>
\r
2472 <name>LOWERCASE DJE / CYRILLIC SMALL LETTER DJE
\r
2478 <utf-8>D193</utf-8>
\r
2479 <name>CYRILLIC SMALL LETTER GJE</name>
\r
2484 <utf-8>D194</utf-8>
\r
2485 <name>LOWERCASE E / CYRILLIC SMALL LETTER UKRAINIAN
\r
2491 <utf-8>D191</utf-8>
\r
2492 <name>CYRILLIC SMALL LETTER IO</name>
\r
2497 <utf-8>D195</utf-8>
\r
2498 <name>CYRILLIC SMALL LETTER DZE</name>
\r
2503 <utf-8>D196</utf-8>
\r
2504 <name>LOWERCASE I / CYRILLIC SMALL LETTER
\r
2505 BYELORUSSIAN-UKRAINIAN I</name>
\r
2510 <utf-8>D197</utf-8>
\r
2511 <name>LOWERCASE YI / CYRILLIC SMALL LETTER YI
\r
2512 (Ukrainian)</name>
\r
2517 <utf-8>D198</utf-8>
\r
2518 <name>CYRILLIC SMALL LETTER JE</name>
\r
2523 <utf-8>D199</utf-8>
\r
2524 <name>CYRILLIC SMALL LETTER LJE</name>
\r
2529 <utf-8>D19A</utf-8>
\r
2530 <name>CYRILLIC SMALL LETTER NJE</name>
\r
2535 <utf-8>D19B</utf-8>
\r
2536 <name>LOWERCASE TSHE / CYRILLIC SMALL LETTER TSHE
\r
2542 <utf-8>D19C</utf-8>
\r
2543 <name>CYRILLIC SMALL LETTER KJE</name>
\r
2548 <utf-8>D19E</utf-8>
\r
2549 <name>LOWERCASE SHORT U / CYRILLIC SMALL LETTER SHORT
\r
2550 U (Byelorussian)</name>
\r
2555 <utf-8>D19F</utf-8>
\r
2556 <name>CYRILLIC SMALL LETTER DZHE</name>
\r
2561 <utf-8>D1A3</utf-8>
\r
2562 <name>CYRILLIC SMALL LETTER YAT</name>
\r
2567 <utf-8>D1B3</utf-8>
\r
2568 <name>CYRILLIC SMALL LETTER FITA</name>
\r
2573 <utf-8>D1B5</utf-8>
\r
2574 <name>CYRILLIC SMALL LETTER IZHITSA</name>
\r
2579 <utf-8>D1AB</utf-8>
\r
2580 <name>CYRILLIC SMALL LETTER BIG YUS</name>
\r
2586 <name>OPENING SQUARE BRACKET / LEFT SQUARE
\r
2593 <name>CLOSING SQUARE BRACKET / RIGHT SQUARE
\r
2600 <name>SPACING UNDERSCORE / LOW LINE</name>
\r
2605 <utf-8>D290</utf-8>
\r
2606 <name>UPPERCASE GE WITH UPTURN / CYRILLIC CAPITAL
\r
2607 LETTER GHE WITH UPTURN</name>
\r
2612 <utf-8>D082</utf-8>
\r
2613 <name>UPPERCASE DJE / CYRILLIC CAPITAL LETTER DJE
\r
2619 <utf-8>D083</utf-8>
\r
2620 <name>CYRILLIC CAPITAL LETTER GJE</name>
\r
2625 <utf-8>D084</utf-8>
\r
2626 <name>UPPERCASE E / CYRILLIC CAPITAL LETTER UKRAINIAN
\r
2632 <utf-8>D081</utf-8>
\r
2633 <name>CYRILLIC CAPITAL LETTER IO</name>
\r
2638 <utf-8>D085</utf-8>
\r
2639 <name>CYRILLIC CAPITAL LETTER DZE</name>
\r
2644 <utf-8>D086</utf-8>
\r
2645 <name>UPPERCASE I / CYRILLIC CAPITAL LETTER
\r
2646 BYELORUSSIAN-UKRAINIAN I</name>
\r
2651 <utf-8>D087</utf-8>
\r
2652 <name>UPPERCASE YI / CYRILLIC CAPITAL LETTER YI
\r
2653 (Ukrainian)</name>
\r
2658 <utf-8>D088</utf-8>
\r
2659 <name>CYRILLIC CAPITAL LETTER JE</name>
\r
2664 <utf-8>D089</utf-8>
\r
2665 <name>CYRILLIC CAPITAL LETTER LJE</name>
\r
2670 <utf-8>D08A</utf-8>
\r
2671 <name>CYRILLIC CAPITAL LETTER NJE</name>
\r
2676 <utf-8>D08B</utf-8>
\r
2677 <name>UPPERCASE TSHE / CYRILLIC CAPITAL LETTER TSHE
\r
2683 <utf-8>D08C</utf-8>
\r
2684 <name>CYRILLIC CAPITAL LETTER KJE</name>
\r
2689 <utf-8>D08E</utf-8>
\r
2690 <name>UPPERCASE SHORT U / CYRILLIC CAPITAL LETTER SHORT
\r
2691 U (Byelorussian)</name>
\r
2696 <utf-8>D08F</utf-8>
\r
2697 <name>CYRILLIC CAPITAL LETTER DZHE</name>
\r
2702 <utf-8>D0AA</utf-8>
\r
2703 <name>CYRILLIC CAPITAL LETTER HARD SIGN</name>
\r
2708 <utf-8>D1A2</utf-8>
\r
2709 <name>CYRILLIC CAPITAL LETTER YAT</name>
\r
2714 <utf-8>D1B2</utf-8>
\r
2715 <name>CYRILLIC CAPITAL LETTER FITA</name>
\r
2720 <utf-8>D1B4</utf-8>
\r
2721 <name>CYRILLIC CAPITAL LETTER IZHITSA</name>
\r
2726 <utf-8>D1AA</utf-8>
\r
2727 <name>CYRILLIC CAPITAL LETTER BIG YUS</name>
\r
2731 <codeTable name="Basic and Extended Arabic" date="July 2001" number="7">
\r
2732 <note>The first column in this table contains the MARC-8 code (in hex) for
\r
2733 the character as coming from the G0 graphic set, the second column
\r
2734 contains the MARC-8 code (in hex) for the character as coming from the G1
\r
2735 graphic set, the third column contains the UCS/Unicode 16-bit code (in
\r
2736 hex), the fourth column contains the UTF-8 code (in hex) for the UCS
\r
2737 characters, the fifth column contains a representation of the character (where possible),
\r
2738 the sixth column contains the MARC character name, followed
\r
2739 by the UCS name. If the MARC name is the same as or very similar to the
\r
2740 UCS name, only the UCS name is given.</note>
\r
2741 <characterSet name="Basic Arabic" ISOcode="33">
\r
2746 <name>EXCLAMATION MARK</name>
\r
2752 <name>QUOTATION MARK</name>
\r
2758 <name>NUMBER SIGN</name>
\r
2764 <name>DOLLAR SIGN</name>
\r
2769 <utf-8>D9AA</utf-8>
\r
2770 <name>PERCENT SIGN / ARABIC PERCENT SIGN</name>
\r
2776 <name>AMPERSAND</name>
\r
2782 <name>APOSTROPHE</name>
\r
2788 <name>OPENING PARENTHESIS / LEFT PARENTHESIS</name>
\r
2794 <name>CLOSING PARENTHESIS / RIGHT PARENTHESIS</name>
\r
2799 <utf-8>D9AD</utf-8>
\r
2800 <name>ASTERISK / ARABIC FIVE POINTED STAR</name>
\r
2806 <name>PLUS SIGN</name>
\r
2811 <utf-8>D88C</utf-8>
\r
2812 <name>ARABIC COMMA</name>
\r
2818 <name>HYPHEN-MINUS</name>
\r
2824 <name>PERIOD, DECIMAL POINT / FULL STOP</name>
\r
2830 <name>SLASH / SOLIDUS</name>
\r
2835 <utf-8>D9A0</utf-8>
\r
2836 <name>ARABIC-INDIC DIGIT ZERO</name>
\r
2841 <utf-8>D9A1</utf-8>
\r
2842 <name>ARABIC-INDIC DIGIT ONE</name>
\r
2847 <utf-8>D9A2</utf-8>
\r
2848 <name>ARABIC-INDIC DIGIT TWO</name>
\r
2853 <utf-8>D9A3</utf-8>
\r
2854 <name>ARABIC-INDIC DIGIT THREE</name>
\r
2859 <utf-8>D9A4</utf-8>
\r
2860 <name>ARABIC-INDIC DIGIT FOUR</name>
\r
2865 <utf-8>D9A5</utf-8>
\r
2866 <name>ARABIC-INDIC DIGIT FIVE</name>
\r
2871 <utf-8>D9A6</utf-8>
\r
2872 <name>ARABIC-INDIC DIGIT SIX</name>
\r
2877 <utf-8>D9A7</utf-8>
\r
2878 <name>ARABIC-INDIC DIGIT SEVEN</name>
\r
2883 <utf-8>D9A8</utf-8>
\r
2884 <name>ARABIC-INDIC DIGIT EIGHT</name>
\r
2889 <utf-8>D9A9</utf-8>
\r
2890 <name>ARABIC-INDIC DIGIT NINE</name>
\r
2896 <name>COLON</name>
\r
2901 <utf-8>D89B</utf-8>
\r
2902 <name>ARABIC SEMICOLON</name>
\r
2908 <name>LESS-THAN SIGN</name>
\r
2914 <name>EQUALS SIGN</name>
\r
2920 <name>GREATER-THAN SIGN</name>
\r
2925 <utf-8>D89F</utf-8>
\r
2926 <name>ARABIC QUESTION MARK</name>
\r
2931 <utf-8>D8A1</utf-8>
\r
2932 <name>HAMZAH / ARABIC LETTER HAMZA</name>
\r
2937 <utf-8>D8A2</utf-8>
\r
2938 <name>ARABIC LETTER ALEF WITH MADDA ABOVE</name>
\r
2943 <utf-8>D8A3</utf-8>
\r
2944 <name>ARABIC LETTER ALEF WITH HAMZA ABOVE</name>
\r
2949 <utf-8>D8A4</utf-8>
\r
2950 <name>ARABIC LETTER WAW WITH HAMZA ABOVE</name>
\r
2955 <utf-8>D8A5</utf-8>
\r
2956 <name>ARABIC LETTER ALEF WITH HAMZA BELOW</name>
\r
2961 <utf-8>D8A6</utf-8>
\r
2962 <name>ARABIC LETTER YEH WITH HAMZA ABOVE</name>
\r
2967 <utf-8>D8A7</utf-8>
\r
2968 <name>ARABIC LETTER ALEF</name>
\r
2973 <utf-8>D8A8</utf-8>
\r
2974 <name>ARABIC LETTER BEH</name>
\r
2979 <utf-8>D8A9</utf-8>
\r
2980 <name>ARABIC LETTER TEH MARBUTA</name>
\r
2985 <utf-8>D8AA</utf-8>
\r
2986 <name>ARABIC LETTER TEH</name>
\r
2991 <utf-8>D8AB</utf-8>
\r
2992 <name>ARABIC LETTER THEH</name>
\r
2997 <utf-8>D8AC</utf-8>
\r
2998 <name>ARABIC LETTER JEEM</name>
\r
3003 <utf-8>D8AD</utf-8>
\r
3004 <name>ARABIC LETTER HAH</name>
\r
3009 <utf-8>D8AE</utf-8>
\r
3010 <name>ARABIC LETTER KHAH</name>
\r
3015 <utf-8>D8AF</utf-8>
\r
3016 <name>ARABIC LETTER DAL</name>
\r
3021 <utf-8>D8B0</utf-8>
\r
3022 <name>ARABIC LETTER THAL</name>
\r
3027 <utf-8>D8B1</utf-8>
\r
3028 <name>ARABIC LETTER REH</name>
\r
3033 <utf-8>D8B2</utf-8>
\r
3034 <name>ARABIC LETTER ZAIN</name>
\r
3039 <utf-8>D8B3</utf-8>
\r
3040 <name>ARABIC LETTER SEEN</name>
\r
3045 <utf-8>D8B4</utf-8>
\r
3046 <name>ARABIC LETTER SHEEN</name>
\r
3051 <utf-8>D8B5</utf-8>
\r
3052 <name>ARABIC LETTER SAD</name>
\r
3057 <utf-8>D8B6</utf-8>
\r
3058 <name>ARABIC LETTER DAD</name>
\r
3063 <utf-8>D8B7</utf-8>
\r
3064 <name>ARABIC LETTER TAH</name>
\r
3069 <utf-8>D8B8</utf-8>
\r
3070 <name>ARABIC LETTER ZAH</name>
\r
3075 <utf-8>D8B9</utf-8>
\r
3076 <name>ARABIC LETTER AIN</name>
\r
3081 <utf-8>D8BA</utf-8>
\r
3082 <name>ARABIC LETTER GHAIN</name>
\r
3088 <name>OPENING SQUARE BRACKET / LEFT SQUARE
\r
3095 <name>CLOSING SQUARE BRACKET / RIGHT SQUARE
\r
3101 <utf-8>D980</utf-8>
\r
3102 <name>ARABIC TATWEEL</name>
\r
3107 <utf-8>D981</utf-8>
\r
3108 <name>ARABIC LETTER FEH</name>
\r
3113 <utf-8>D982</utf-8>
\r
3114 <name>ARABIC LETTER QAF</name>
\r
3119 <utf-8>D983</utf-8>
\r
3120 <name>ARABIC LETTER KAF</name>
\r
3125 <utf-8>D984</utf-8>
\r
3126 <name>ARABIC LETTER LAM</name>
\r
3131 <utf-8>D985</utf-8>
\r
3132 <name>ARABIC LETTER MEEM</name>
\r
3137 <utf-8>D986</utf-8>
\r
3138 <name>ARABIC LETTER NOON</name>
\r
3143 <utf-8>D987</utf-8>
\r
3144 <name>ARABIC LETTER HEH</name>
\r
3149 <utf-8>D988</utf-8>
\r
3150 <name>ARABIC LETTER WAW</name>
\r
3155 <utf-8>D989</utf-8>
\r
3156 <name>ARABIC LETTER ALEF MAKSURA</name>
\r
3161 <utf-8>D98A</utf-8>
\r
3162 <name>ARABIC LETTER YEH</name>
\r
3165 <isCombining>true</isCombining>
\r
3168 <utf-8>D98B</utf-8>
\r
3169 <name>ARABIC FATHATAN</name>
\r
3172 <isCombining>true</isCombining>
\r
3175 <utf-8>D98C</utf-8>
\r
3176 <name>ARABIC DAMMATAN</name>
\r
3179 <isCombining>true</isCombining>
\r
3182 <utf-8>D98D</utf-8>
\r
3183 <name>ARABIC KASRATAN</name>
\r
3186 <isCombining>true</isCombining>
\r
3189 <utf-8>D98E</utf-8>
\r
3190 <name>ARABIC FATHA</name>
\r
3193 <isCombining>true</isCombining>
\r
3196 <utf-8>D98F</utf-8>
\r
3197 <name>ARABIC DAMMA</name>
\r
3200 <isCombining>true</isCombining>
\r
3203 <utf-8>D990</utf-8>
\r
3204 <name>ARABIC KASRA</name>
\r
3207 <isCombining>true</isCombining>
\r
3210 <utf-8>D991</utf-8>
\r
3211 <name>ARABIC SHADDA</name>
\r
3214 <isCombining>true</isCombining>
\r
3217 <utf-8>D992</utf-8>
\r
3218 <name>ARABIC SUKUN</name>
\r
3223 <utf-8>D9B1</utf-8>
\r
3224 <name>ARABIC LETTER ALEF WASLA</name>
\r
3229 <utf-8>D9B0</utf-8>
\r
3230 <name>ARABIC LETTER SUPERSCRIPT ALEF</name>
\r
3235 <utf-8>D9AC</utf-8>
\r
3236 <name>ARABIC THOUSANDS SEPARATOR</name>
\r
3241 <utf-8>E2809D</utf-8>
\r
3242 <name>RIGHT DOUBLE QUOTATION MARK</name>
\r
3247 <utf-8>E2809C</utf-8>
\r
3248 <name>LEFT DOUBLE QUOTATION MARK</name>
\r
3251 <characterSet name="Extended Arabic" ISOcode="34">
\r
3255 <utf-8>DBBD</utf-8>
\r
3256 <name>DOUBLE ALEF WITH HAMZA ABOVE / ARABIC SIGN SINDHI
\r
3262 <utf-8>D9B2</utf-8>
\r
3263 <name>ARABIC LETTER ALEF WITH WAVY HAMZA
\r
3269 <utf-8>D9B3</utf-8>
\r
3270 <name>ARABIC LETTER ALEF WITH WAVY HAMZA
\r
3276 <utf-8>D9B9</utf-8>
\r
3277 <name>ARABIC LETTER TTEH</name>
\r
3282 <utf-8>D9BA</utf-8>
\r
3283 <name>ARABIC LETTER TTEHEH</name>
\r
3288 <utf-8>D9BB</utf-8>
\r
3289 <name>ARABIC LETTER BBEH</name>
\r
3294 <utf-8>D9BC</utf-8>
\r
3295 <name>ARABIC LETTER TEH WITH RING</name>
\r
3300 <utf-8>D9BD</utf-8>
\r
3301 <name>ARABIC LETTER TEH WITH THREE DOTS ABOVE
\r
3307 <utf-8>D9BE</utf-8>
\r
3308 <name>ARABIC LETTER PEH</name>
\r
3313 <utf-8>D9BF</utf-8>
\r
3314 <name>ARABIC LETTER TEHEH</name>
\r
3319 <utf-8>DA80</utf-8>
\r
3320 <name>ARABIC LETTER BEHEH</name>
\r
3325 <utf-8>DA81</utf-8>
\r
3326 <name>ARABIC LETTER HAH WITH HAMZA ABOVE</name>
\r
3331 <utf-8>DA82</utf-8>
\r
3332 <name>ARABIC LETTER HAH WITH TWO DOTS VERTICAL
\r
3338 <utf-8>DA83</utf-8>
\r
3339 <name>ARABIC LETTER NYEH</name>
\r
3344 <utf-8>DA84</utf-8>
\r
3345 <name>ARABIC LETTER DYEH</name>
\r
3350 <utf-8>DA85</utf-8>
\r
3351 <name>ARABIC LETTER HAH WITH THREE DOTS ABOVE</name>
\r
3356 <utf-8>DA86</utf-8>
\r
3357 <name>ARABIC LETTER TCHEH</name>
\r
3362 <utf-8>DABF</utf-8>
\r
3363 <name>ARABIC LETTER TCHEH WITH DOT ABOVE</name>
\r
3368 <utf-8>DA87</utf-8>
\r
3369 <name>ARABIC LETTER TCHEHEH</name>
\r
3374 <utf-8>DA88</utf-8>
\r
3375 <name>ARABIC LETTER DDAL</name>
\r
3380 <utf-8>DA89</utf-8>
\r
3381 <name>ARABIC LETTER DAL WITH RING</name>
\r
3386 <utf-8>DA8A</utf-8>
\r
3387 <name>ARABIC LETTER DAL WITH DOT BELOW</name>
\r
3392 <utf-8>DA8B</utf-8>
\r
3393 <name>ARABIC LETTER DAL WITH DOT BELOW AND SMALL
\r
3399 <utf-8>DA8C</utf-8>
\r
3400 <name>ARABIC LETTER DAHAL</name>
\r
3405 <utf-8>DA8D</utf-8>
\r
3406 <name>ARABIC LETTER DDAHAL</name>
\r
3411 <utf-8>DA8E</utf-8>
\r
3412 <name>ARABIC LETTER DUL</name>
\r
3417 <utf-8>DA8F</utf-8>
\r
3418 <name>ARABIC LETTER DAL WITH THREE DOTS ABOVE
\r
3424 <utf-8>DA90</utf-8>
\r
3425 <name>ARABIC LETTER DAL WITH FOUR DOTS ABOVE</name>
\r
3430 <utf-8>DA91</utf-8>
\r
3431 <name>ARABIC LETTER RREH</name>
\r
3436 <utf-8>DA92</utf-8>
\r
3437 <name>ARABIC LETTER REH WITH SMALL V</name>
\r
3442 <utf-8>DA93</utf-8>
\r
3443 <name>ARABIC LETTER REH WITH RING</name>
\r
3448 <utf-8>DA94</utf-8>
\r
3449 <name>ARABIC LETTER REH WITH DOT BELOW</name>
\r
3454 <utf-8>DA95</utf-8>
\r
3455 <name>ARABIC LETTER REH WITH SMALL V BELOW</name>
\r
3460 <utf-8>DA96</utf-8>
\r
3461 <name>ARABIC LETTER REH WITH DOT BELOW AND DOT
\r
3467 <utf-8>DA97</utf-8>
\r
3468 <name>ARABIC LETTER REH WITH TWO DOTS ABOVE</name>
\r
3473 <utf-8>DA98</utf-8>
\r
3474 <name>ARABIC LETTER JEH</name>
\r
3479 <utf-8>DA99</utf-8>
\r
3480 <name>ARABIC LETTER REH WITH FOUR DOTS ABOVE</name>
\r
3485 <utf-8>DA9A</utf-8>
\r
3486 <name>ARABIC LETTER SEEN WITH DOT BELOW AND DOT
\r
3492 <utf-8>DA9B</utf-8>
\r
3493 <name>ARABIC LETTER SEEN WITH THREE DOTS BELOW</name>
\r
3498 <utf-8>DA9C</utf-8>
\r
3499 <name>ARABIC LETTER SEEN WITH THREE DOTS BELOW AND
\r
3500 THREE DOTS ABOVE</name>
\r
3505 <utf-8>DBBA</utf-8>
\r
3506 <name>ARABIC LETTER SHEEN WITH DOT BELOW</name>
\r
3511 <utf-8>DA9D</utf-8>
\r
3512 <name>ARABIC LETTER SAD WITH TWO DOTS BELOW</name>
\r
3517 <utf-8>DA9E</utf-8>
\r
3518 <name>ARABIC LETTER SAD WITH THREE DOTS ABOVE</name>
\r
3523 <utf-8>DBBB</utf-8>
\r
3524 <name>ARABIC LETTER DAD WITH DOT BELOW</name>
\r
3529 <utf-8>DA9F</utf-8>
\r
3530 <name>ARABIC LETTER TAH WITH THREE DOTS ABOVE</name>
\r
3535 <utf-8>DAA0</utf-8>
\r
3536 <name>ARABIC LETTER AIN WITH THREE DOTS ABOVE</name>
\r
3541 <utf-8>DBBC</utf-8>
\r
3542 <name>ARABIC LETTER GHAIN WITH DOT BELOW</name>
\r
3547 <utf-8>DAA1</utf-8>
\r
3548 <name>ARABIC LETTER DOTLESS FEH</name>
\r
3553 <utf-8>DAA2</utf-8>
\r
3554 <name>ARABIC LETTER FEH WITH DOT MOVED BELOW</name>
\r
3559 <utf-8>DAA3</utf-8>
\r
3560 <name>ARABIC LETTER FEH WITH DOT BELOW</name>
\r
3565 <utf-8>DAA4</utf-8>
\r
3566 <name>ARABIC LETTER VEH</name>
\r
3571 <utf-8>DAA5</utf-8>
\r
3572 <name>ARABIC LETTER FEH WITH THREE DOTS BELOW</name>
\r
3577 <utf-8>DAA6</utf-8>
\r
3578 <name>ARABIC LETTER PEHEH</name>
\r
3583 <utf-8>DAA7</utf-8>
\r
3584 <name>ARABIC LETTER QAF WITH DOT ABOVE</name>
\r
3589 <utf-8>DAA8</utf-8>
\r
3590 <name>ARABIC LETTER QAF WITH THREE DOTS ABOVE</name>
\r
3595 <utf-8>DAA9</utf-8>
\r
3596 <name>ARABIC LETTER KEHEH</name>
\r
3601 <utf-8>DAAA</utf-8>
\r
3602 <name>ARABIC LETTER SWASH KAF</name>
\r
3607 <utf-8>DAAB</utf-8>
\r
3608 <name>ARABIC LETTER KAF WITH RING</name>
\r
3613 <utf-8>DAAC</utf-8>
\r
3614 <name>ARABIC LETTER KAF WITH DOT ABOVE</name>
\r
3619 <utf-8>DAAD</utf-8>
\r
3620 <name>ARABIC LETTER NG</name>
\r
3625 <utf-8>DAAE</utf-8>
\r
3626 <name>ARABIC LETTER KAF WITH THREE DOTS BELOW</name>
\r
3631 <utf-8>DAAF</utf-8>
\r
3632 <name>ARABIC LETTER GAF</name>
\r
3637 <utf-8>DAB0</utf-8>
\r
3638 <name>ARABIC LETTER GAF WITH RING</name>
\r
3643 <utf-8>DAB1</utf-8>
\r
3644 <name>ARABIC LETTER NGOEH</name>
\r
3649 <utf-8>DAB2</utf-8>
\r
3650 <name>ARABIC LETTER GAF WITH TWO DOTS BELOW</name>
\r
3655 <utf-8>DAB3</utf-8>
\r
3656 <name>ARABIC LETTER GUEH</name>
\r
3661 <utf-8>DAB4</utf-8>
\r
3662 <name>ARABIC LETTER GAF WITH THREE DOTS ABOVE</name>
\r
3667 <utf-8>DAB5</utf-8>
\r
3668 <name>ARABIC LETTER LAM WITH SMALL V</name>
\r
3673 <utf-8>DAB6</utf-8>
\r
3674 <name>ARABIC LETTER LAM WITH DOT ABOVE</name>
\r
3679 <utf-8>DAB7</utf-8>
\r
3680 <name>ARABIC LETTER LAM WITH THREE DOTS ABOVE</name>
\r
3685 <utf-8>DAB8</utf-8>
\r
3686 <name>ARABIC LETTER LAM WITH THREE DOTS BELOW</name>
\r
3691 <utf-8>DABA</utf-8>
\r
3692 <name>ARABIC LETTER NOON GHUNNA</name>
\r
3697 <utf-8>DABB</utf-8>
\r
3698 <name>ARABIC LETTER RNOON</name>
\r
3703 <utf-8>DABC</utf-8>
\r
3704 <name>ARABIC LETTER NOON WITH RING</name>
\r
3709 <utf-8>DABD</utf-8>
\r
3710 <name>ARABIC LETTER NOON WITH THREE DOTS ABOVE</name>
\r
3715 <utf-8>DAB9</utf-8>
\r
3716 <name>ARABIC LETTER NOON WITH DOT BELOW</name>
\r
3721 <utf-8>DABE</utf-8>
\r
3722 <name>ARABIC LETTER HEH DOACHASHMEE</name>
\r
3727 <utf-8>DB80</utf-8>
\r
3728 <name>HEH WITH HAMZA ABOVE / ARABIC LETTER HEH WITH
\r
3734 <utf-8>DB84</utf-8>
\r
3735 <name>ARABIC LETTER WAW WITH RING</name>
\r
3740 <utf-8>DB85</utf-8>
\r
3741 <name>KYRGHYZ OE / ARABIC LETTER KIRGHIZ OE</name>
\r
3746 <utf-8>DB86</utf-8>
\r
3747 <name>ARABIC LETTER OE</name>
\r
3752 <utf-8>DB8A</utf-8>
\r
3753 <name>ARABIC LETTER WAW WITH TWO DOTS ABOVE</name>
\r
3758 <utf-8>DB8B</utf-8>
\r
3759 <name>ARABIC LETTER VE</name>
\r
3764 <utf-8>DB8D</utf-8>
\r
3765 <name>ARABIC LETTER YEH WITH TAIL</name>
\r
3770 <utf-8>DB8E</utf-8>
\r
3771 <name>ARABIC LETTER YEH WITH SMALL V</name>
\r
3776 <utf-8>DB90</utf-8>
\r
3777 <name>ARABIC LETTER E</name>
\r
3782 <utf-8>DB92</utf-8>
\r
3783 <name>ARABIC LETTER YEH BARREE</name>
\r
3788 <utf-8>DB93</utf-8>
\r
3789 <name>ARABIC LETTER YEH BARREE WITH HAMZA
\r
3793 <isCombining>true</isCombining>
\r
3796 <utf-8>CC86</utf-8>
\r
3797 <name>SHORT E / COMBINING BREVE</name>
\r
3800 <isCombining>true</isCombining>
\r
3803 <utf-8>CC8C</utf-8>
\r
3804 <name>SHORT U / COMBINING CARON</name>
\r
3808 <codeTable name="Greek" date="January 2000" number="8">
\r
3809 <note>The first column in this table contains the MARC-8 code (in hex) for
\r
3810 the character as coming from the G0 graphic set, the second column
\r
3811 contains the MARC-8 code (in hex) for the character as coming from the G1
\r
3812 graphic set, the third column contains the UCS/Unicode 16-bit code (in
\r
3813 hex), the fourth column contains the UTF-8 code (in hex) for the UCS
\r
3814 characters, the fifth column contains a representation of the character (where possible),
\r
3815 the sixth column contains the MARC character name, followed
\r
3816 by the UCS name. If the MARC name is the same as or very similar to the
\r
3817 UCS name, only the UCS name is given.</note>
\r
3818 <characterSet name="Basic Greek" ISOcode="53">
\r
3820 <isCombining>true</isCombining>
\r
3823 <utf-8>CC80</utf-8>
\r
3824 <name>COMBINING GRAVE ACCENT</name>
\r
3827 <isCombining>true</isCombining>
\r
3830 <utf-8>CC81</utf-8>
\r
3831 <name>COMBINING ACUTE ACCENT</name>
\r
3834 <isCombining>true</isCombining>
\r
3837 <utf-8>CC88</utf-8>
\r
3838 <name>COMBINING DIAERESIS</name>
\r
3841 <isCombining>true</isCombining>
\r
3844 <utf-8>CD82</utf-8>
\r
3845 <name>COMBINING GREEK PERISPOMENI / CIRCUMFLEX</name>
\r
3848 <isCombining>true</isCombining>
\r
3851 <utf-8>CC93</utf-8>
\r
3852 <name>COMBINING COMMA ABOVE / SMOOTH
\r
3856 <isCombining>true</isCombining>
\r
3859 <utf-8>CC94</utf-8>
\r
3860 <name>COMBINING REVERSED COMMA ABOVE / ROUGH
\r
3864 <isCombining>true</isCombining>
\r
3867 <utf-8>CD85</utf-8>
\r
3868 <name>COMBINING GREEK YPOGEGRAMMENI / IOTA
\r
3874 <utf-8>C2AB</utf-8>
\r
3875 <name>LEFT-POINTING DOUBLE ANGLE QUOTATION
\r
3881 <utf-8>C2BB</utf-8>
\r
3882 <name>RIGHT-POINTING DOUBLE ANGLE QUOTATION
\r
3888 <utf-8>E2809C</utf-8>
\r
3889 <name>LEFT DOUBLE QUOTATION MARK</name>
\r
3894 <utf-8>E2809D</utf-8>
\r
3895 <name>RIGHT DOUBLE QUOTATION MARK</name>
\r
3900 <utf-8>CDB4</utf-8>
\r
3901 <name>GREEK NUMERAL SIGN / UPPER PRIME</name>
\r
3906 <utf-8>CDB5</utf-8>
\r
3907 <name>GREEK LOWER NUMERAL SIGN / LOWER PRIME</name>
\r
3912 <utf-8>CE87</utf-8>
\r
3913 <name>GREEK ANO TELEIA / RAISED DOT, GREEK
\r
3919 <utf-8>CDBE</utf-8>
\r
3920 <name>GREEK QUESTION MARK</name>
\r
3925 <utf-8>CE91</utf-8>
\r
3926 <name>GREEK CAPITAL LETTER ALPHA</name>
\r
3931 <utf-8>CE92</utf-8>
\r
3932 <name>GREEK CAPITAL LETTER BETA</name>
\r
3937 <utf-8>CE93</utf-8>
\r
3938 <name>GREEK CAPITAL LETTER GAMMA</name>
\r
3943 <utf-8>CE94</utf-8>
\r
3944 <name>GREEK CAPITAL LETTER DELTA</name>
\r
3949 <utf-8>CE95</utf-8>
\r
3950 <name>GREEK CAPITAL LETTER EPSILON</name>
\r
3955 <utf-8>CF9A</utf-8>
\r
3956 <name>GREEK LETTER STIGMA</name>
\r
3961 <utf-8>CF9C</utf-8>
\r
3962 <name>GREEK LETTER DIGAMMA</name>
\r
3967 <utf-8>CE96</utf-8>
\r
3968 <name>GREEK CAPITAL LETTER ZETA</name>
\r
3973 <utf-8>CE97</utf-8>
\r
3974 <name>GREEK CAPITAL LETTER ETA</name>
\r
3979 <utf-8>CE98</utf-8>
\r
3980 <name>GREEK CAPITAL LETTER THETA</name>
\r
3985 <utf-8>CE99</utf-8>
\r
3986 <name>GREEK CAPITAL LETTER IOTA</name>
\r
3991 <utf-8>CE9A</utf-8>
\r
3992 <name>GREEK CAPITAL LETTER KAPPA</name>
\r
3997 <utf-8>CE9B</utf-8>
\r
3998 <name>GREEK CAPITAL LETTER LAMDA</name>
\r
4003 <utf-8>CE9C</utf-8>
\r
4004 <name>GREEK CAPITAL LETTER MU</name>
\r
4009 <utf-8>CE9D</utf-8>
\r
4010 <name>GREEK CAPITAL LETTER NU</name>
\r
4015 <utf-8>CE9E</utf-8>
\r
4016 <name>GREEK CAPITAL LETTER XI</name>
\r
4021 <utf-8>CE9F</utf-8>
\r
4022 <name>GREEK CAPITAL LETTER OMICRON</name>
\r
4027 <utf-8>CEA0</utf-8>
\r
4028 <name>GREEK CAPITAL LETTER PI</name>
\r
4033 <utf-8>CF9E</utf-8>
\r
4034 <name>GREEK LETTER KOPPA</name>
\r
4039 <utf-8>CEA1</utf-8>
\r
4040 <name>GREEK CAPITAL LETTER RHO</name>
\r
4045 <utf-8>CEA3</utf-8>
\r
4046 <name>GREEK CAPITAL LETTER SIGMA</name>
\r
4051 <utf-8>CEA4</utf-8>
\r
4052 <name>GREEK CAPITAL LETTER TAU</name>
\r
4057 <utf-8>CEA5</utf-8>
\r
4058 <name>GREEK CAPITAL LETTER UPSILON</name>
\r
4063 <utf-8>CEA6</utf-8>
\r
4064 <name>GREEK CAPITAL LETTER PHI</name>
\r
4069 <utf-8>CEA7</utf-8>
\r
4070 <name>GREEK CAPITAL LETTER CHI</name>
\r
4075 <utf-8>CEA8</utf-8>
\r
4076 <name>GREEK CAPITAL LETTER PSI</name>
\r
4081 <utf-8>CEA9</utf-8>
\r
4082 <name>GREEK CAPITAL LETTER OMEGA</name>
\r
4087 <utf-8>CFA0</utf-8>
\r
4088 <name>GREEK LETTER SAMPI</name>
\r
4093 <utf-8>CEB1</utf-8>
\r
4094 <name>GREEK SMALL LETTER ALPHA</name>
\r
4099 <utf-8>CEB2</utf-8>
\r
4100 <name>GREEK SMALL LETTER BETA / SMALL LETTER BETA
\r
4101 BEGINNING OF WORD</name>
\r
4106 <utf-8>CF90</utf-8>
\r
4107 <name>GREEK BETA SYMBOL / SMALL LETTER BETA MIDDLE OF
\r
4113 <utf-8>CEB3</utf-8>
\r
4114 <name>GREEK SMALL LETTER GAMMA</name>
\r
4119 <utf-8>CEB4</utf-8>
\r
4120 <name>GREEK SMALL LETTER DELTA</name>
\r
4125 <utf-8>CEB5</utf-8>
\r
4126 <name>GREEK SMALL LETTER EPSILON</name>
\r
4131 <utf-8>CF9B</utf-8>
\r
4132 <name>GREEK SMALL LETTER STIGMA</name>
\r
4137 <utf-8>CF9D</utf-8>
\r
4138 <name>GREEK SMALL LETTER DIGAMMA</name>
\r
4143 <utf-8>CEB6</utf-8>
\r
4144 <name>GREEK SMALL LETTER ZETA</name>
\r
4149 <utf-8>CEB7</utf-8>
\r
4150 <name>GREEK SMALL LETTER ETA</name>
\r
4155 <utf-8>CEB8</utf-8>
\r
4156 <name>GREEK SMALL LETTER THETA</name>
\r
4161 <utf-8>CEB9</utf-8>
\r
4162 <name>GREEK SMALL LETTER IOTA</name>
\r
4167 <utf-8>CEBA</utf-8>
\r
4168 <name>GREEK SMALL LETTER KAPPA</name>
\r
4173 <utf-8>CEBB</utf-8>
\r
4174 <name>GREEK SMALL LETTER LAMDA</name>
\r
4179 <utf-8>CEBC</utf-8>
\r
4180 <name>GREEK SMALL LETTER MU</name>
\r
4185 <utf-8>CEBD</utf-8>
\r
4186 <name>GREEK SMALL LETTER NU</name>
\r
4191 <utf-8>CEBE</utf-8>
\r
4192 <name>GREEK SMALL LETTER XI</name>
\r
4197 <utf-8>CEBF</utf-8>
\r
4198 <name>GREEK SMALL LETTER OMICRON</name>
\r
4203 <utf-8>CF80</utf-8>
\r
4204 <name>GREEK SMALL LETTER PI</name>
\r
4209 <utf-8>CF9F</utf-8>
\r
4210 <name>GREEK SMALL LETTER KOPPA</name>
\r
4215 <utf-8>CF81</utf-8>
\r
4216 <name>GREEK SMALL LETTER RHO</name>
\r
4221 <utf-8>CF83</utf-8>
\r
4222 <name>GREEK SMALL LETTER SIGMA</name>
\r
4227 <utf-8>CF82</utf-8>
\r
4228 <name>GREEK SMALL LETTER FINAL SIGMA / SMALL LETTER
\r
4229 SIGMA END OF WORD</name>
\r
4234 <utf-8>CF84</utf-8>
\r
4235 <name>GREEK SMALL LETTER TAU</name>
\r
4240 <utf-8>CF85</utf-8>
\r
4241 <name>GREEK SMALL LETTER UPSILON</name>
\r
4246 <utf-8>CF86</utf-8>
\r
4247 <name>GREEK SMALL LETTER PHI</name>
\r
4252 <utf-8>CF87</utf-8>
\r
4253 <name>GREEK SMALL LETTER CHI</name>
\r
4258 <utf-8>CF88</utf-8>
\r
4259 <name>GREEK SMALL LETTER PSI</name>
\r
4264 <utf-8>CF89</utf-8>
\r
4265 <name>GREEK SMALL LETTER OMEGA</name>
\r
4270 <utf-8>CFA1</utf-8>
\r
4271 <name>GREEK SMALL LETTER SAMPI</name>
\r