X-Git-Url: http://shamusworld.gotdns.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=src%2Fcharnames.cpp;fp=src%2Fcharnames.cpp;h=5fec44024f271ef2a3f51817a0c702ca9d05d768;hb=c84263bb8b0d16e4c6da49aa0b7d0bc904ae02b1;hp=84eaf300f51e3a6a73cbbe9a4894a94e7d92032f;hpb=5c7c36b21d0f2a88accd8ff12c05dcc3004ce0e8;p=ttedit diff --git a/src/charnames.cpp b/src/charnames.cpp index 84eaf30..5fec440 100755 --- a/src/charnames.cpp +++ b/src/charnames.cpp @@ -1,2632 +1,2632 @@ -// -// CHARNAMES.CPP -// -// A header file that links Unicode character names to character numbers. -// by James L. Hammons -// (C) 2004 Underground Software -// -// JLH = James L. Hammons -// -// Who When What -// --- ---------- ------------------------------------------------------------- -// JLH ??/??/200? Created this file -// - -unsigned char macStdNames[] = { - "\x06""notdef" - "\x05"".null" - "\x02""CR" - "\x05""space" - "\x06""exclam" - "\x08""quotedbl" - "\x0A""numbersign" - "\x06""dollar" - "\x07""percent" - "\x09""ampersand" - "\x0B""quotesingle" - "\x09""parenleft" - "\x0A""parenright" - "\x08""asterisk" - "\x04""plus" - "\x05""comma" - "\x06""hyphen" - "\x06""period" - "\x05""slash" - "\x04""zero" - "\x03""one" - "\x03""two" - "\x05""three" - "\x04""four" - "\x04""five" - "\x03""six" - "\x05""seven" - "\x05""eight" - "\x04""nine" - "\x05""colon" - "\x09""semicolon" - "\x04""less" - "\x05""equal" - "\x07""greater" - "\x08""question" - "\x02""at" - "\x01""A" - "\x01""B" - "\x01""C" - "\x01""D" - "\x01""E" - "\x01""F" - "\x01""G" - "\x01""H" - "\x01""I" - "\x01""J" - "\x01""K" - "\x01""L" - "\x01""M" - "\x01""N" - "\x01""O" - "\x01""P" - "\x01""Q" - "\x01""R" - "\x01""S" - "\x01""T" - "\x01""U" - "\x01""V" - "\x01""W" - "\x01""X" - "\x01""Y" - "\x01""Z" - "\x0B""bracketleft" - "\x09""backslash" - "\x0C""bracketright" - "\x0B""asciicircum" - "\x0A""underscore" - "\x05""grave" - "\x01""a" - "\x01""b" - "\x01""c" - "\x01""d" - "\x01""e" - "\x01""f" - "\x01""g" - "\x01""h" - "\x01""i" - "\x01""j" - "\x01""k" - "\x01""l" - "\x01""m" - "\x01""n" - "\x01""o" - "\x01""p" - "\x01""q" - "\x01""r" - "\x01""s" - "\x01""t" - "\x01""u" - "\x01""v" - "\x01""w" - "\x01""x" - "\x01""y" - "\x01""z" - "\x09""braceleft" - "\x03""bar" - "\x0A""braceright" - "\x0A""asciitilde" - "\x09""Adieresis" - "\x05""Aring" - "\x08""Ccedilla" - "\x06""Eacute" - "\x06""Ntilde" - "\x09""Odieresis" - "\x09""Udieresis" - "\x06""aacute" - "\x06""agrave" - "\x0B""acircumflex" - "\x09""adieresis" - "\x06""atilde" - "\x05""aring" - "\x08""ccedilla" - "\x06""eacute" - "\x06""egrave" - "\x0B""ecircumflex" - "\x09""edieresis" - "\x06""iacute" - "\x06""igrave" - "\x0B""icircumflex" - "\x09""idieresis" - "\x06""ntilde" - "\x06""oacute" - "\x06""ograve" - "\x0B""ocircumflex" - "\x09""odieresis" - "\x06""otilde" - "\x06""uacute" - "\x06""ugrave" - "\x0B""ucircumflex" - "\x09""udieresis" - "\x06""dagger" - "\x06""degree" - "\x04""cent" - "\x08""sterling" - "\x07""section" - "\x06""bullet" - "\x09""paragraph" - "\x0A""germandbls" - "\x0A""registered" - "\x09""copyright" - "\x09""trademark" - "\x05""acute" - "\x08""dieresis" - "\x08""notequal" - "\x02""AE" - "\x06""Oslash" - "\x08""infinity" - "\x09""plusminus" - "\x09""lessequal" - "\x0C""greaterequal" - "\x03""yen" - "\x03""mu1" - "\x0B""partialdiff" - "\x09""summation" - "\x07""product" - "\x02""pi" - "\x08""integral" - "\x0B""ordfeminine" - "\x0C""ordmasculine" - "\x03""Ohm" - "\x02""ae" - "\x06""oslash" - "\x0C""questiondown" - "\x0A""exclamdown" - "\x0A""logicalnot" - "\x07""radical" - "\x06""florin" - "\x0B""approxequal" - "\x09""increment" - "\x0D""guillemotleft" - "\x0E""guillemotright" - "\x08""ellipsis" - "\x07""nbspace" - "\x06""Agrave" - "\x06""Atilde" - "\x06""Otilde" - "\x02""OE" - "\x02""oe" - "\x06""endash" - "\x06""emdash" - "\x0C""quotedblleft" - "\x0D""quotedblright" - "\x09""quoteleft" - "\x0A""quoteright" - "\x06""divide" - "\x07""lozenge" - "\x09""ydieresis" - "\x09""Ydieresis" - "\x08""fraction" - "\x08""currency" - "\x0D""guilsinglleft" - "\x0E""guilsinglright" - "\x02""fi" - "\x02""fl" - "\x09""daggerdbl" - "\x0E""periodcentered" - "\x0E""quotesinglbase" - "\x0C""quotedblbase" - "\x0B""perthousand" - "\x0B""Acircumflex" - "\x0B""Ecircumflex" - "\x06""Aacute" - "\x09""Edieresis" - "\x06""Egrave" - "\x06""Iacute" - "\x0B""Icircumflex" - "\x09""Idieresis" - "\x06""Igrave" - "\x06""Oacute" - "\x0B""Ocircumflex" - "\x09""applelogo" - "\x06""Ograve" - "\x06""Uacute" - "\x0B""Ucircumflex" - "\x06""Ugrave" - "\x08""dotlessi" - "\x0A""circumflex" - "\x05""tilde" - "\x09""overscore" - "\x05""breve" - "\x09""dotaccent" - "\x04""ring" - "\x07""cedilla" - "\x0C""hungarumlaut" - "\x06""ogonek" - "\x05""caron" - "\x06""Lslash" - "\x06""lslash" - "\x06""Scaron" - "\x06""scaron" - "\x06""Zcaron" - "\x06""zcaron" - "\x09""brokenbar" - "\x03""Eth" - "\x03""eth" - "\x06""Yacute" - "\x06""yacute" - "\x05""Thorn" - "\x05""thorn" - "\x05""minus" - "\x08""multiply" - "\x0B""onesuperior" - "\x0B""twosuperior" - "\x0D""threesuperior" - "\x07""onehalf" - "\x0A""onequarter" - "\x0D""threequarters" - "\x05""franc" - "\x06""Gbreve" - "\x06""gbreve" - "\x04""Idot" - "\x08""Scedilla" - "\x08""scedilla" - "\x06""Cacute" - "\x06""cacute" - "\x06""Ccaron" - "\x06""ccaron" - "\x07""dmacron" -}; - -/*struct unicodeChar -{ - int cNum; - -};*/ - -unsigned char unicodeChars[] = { - "\x00\x20""space\0" - "\x00\x21""exclamation mark\0" - "\x00\x22""quotation mark\0" - "\x00\x23""number sign\0" - -}; - -/* - -0023 NUMBER SIGN - = pound sign, hash, crosshatch, octothorpe -0024 DOLLAR SIGN - = milreis, escudo - * glyph may have one or two vertical bars - * other currency symbol characters: 20A0-20AF - x (currency sign - 00A4) -0025 PERCENT SIGN - x (arabic percent sign - 066A) - x (per mille sign - 2030) - x (per ten thousand sign - 2031) -0026 AMPERSAND -0027 APOSTROPHE - = APOSTROPHE-QUOTE - = APL quote - * neutral (vertical) glyph having mixed usage - * preferred character for apostrophe is 2019 - * preferred characters in English for paired quotation marks are 2018 & 2019 - x (modifier letter prime - 02B9) - x (modifier letter apostrophe - 02BC) - x (modifier letter vertical line - 02C8) - x (combining acute accent - 0301) - x (prime - 2032) -0028 LEFT PARENTHESIS - = OPENING PARENTHESIS -0029 RIGHT PARENTHESIS - = CLOSING PARENTHESIS - * see discussion on semantics of paired bracketing characters -002A ASTERISK - = star (on phone keypads) - x (arabic five pointed star - 066D) - x (asterisk operator - 2217) - x (heavy asterisk - 2731) -002B PLUS SIGN -002C COMMA - = decimal separator - x (arabic comma - 060C) - x (single low-9 quotation mark - 201A) - x (ideographic comma - 3001) -002D HYPHEN-MINUS - = hyphen or minus sign - * used for either hyphen or minus sign - x (hyphen - 2010) - x (non-breaking hyphen - 2011) - x (figure dash - 2012) - x (en dash - 2013) - x (minus sign - 2212) -002E FULL STOP - = PERIOD - = dot, decimal point - * may be rendered as a raised decimal point in old style numbers - x (arabic full stop - 06D4) - x (ideographic full stop - 3002) -002F SOLIDUS - = SLASH - = virgule, shilling (British) - x (latin letter dental click - 01C0) - x (combining long solidus overlay - 0338) - x (fraction slash - 2044) - x (division slash - 2215) -0030 DIGIT ZERO -0031 DIGIT ONE -0032 DIGIT TWO -0033 DIGIT THREE -0034 DIGIT FOUR -0035 DIGIT FIVE -0036 DIGIT SIX -0037 DIGIT SEVEN -0038 DIGIT EIGHT -0039 DIGIT NINE -003A COLON - x (armenian full stop - 0589) - x (hebrew punctuation sof pasuq - 05C3) - x (ratio - 2236) -003B SEMICOLON - x (greek question mark - 037E) - x (arabic semicolon - 061B) -003C LESS-THAN SIGN - x (single left-pointing angle quotation mark - 2039) - x (left-pointing angle bracket - 2329) - x (left angle bracket - 3008) -003D EQUALS SIGN - * other related characters: 2241-2263 - x (not equal to - 2260) - x (identical to - 2261) -003E GREATER-THAN SIGN - x (single right-pointing angle quotation mark - 203A) - x (right-pointing angle bracket - 232A) - x (right angle bracket - 3009) -003F QUESTION MARK - x (inverted question mark - 00BF) - x (greek question mark - 037E) - x (arabic question mark - 061F) - x (interrobang - 203D) - x (question exclamation mark - 2048) - x (exclamation question mark - 2049) -0040 COMMERCIAL AT -0041 LATIN CAPITAL LETTER A -0042 LATIN CAPITAL LETTER B - x (script capital b - 212C) -0043 LATIN CAPITAL LETTER C - x (double-struck capital c - 2102) - x (black-letter capital c - 212D) -0044 LATIN CAPITAL LETTER D -0045 LATIN CAPITAL LETTER E - x (euler constant - 2107) - x (script capital e - 2130) -0046 LATIN CAPITAL LETTER F - x (script capital f - 2131) - x (turned capital f - 2132) -0047 LATIN CAPITAL LETTER G -0048 LATIN CAPITAL LETTER H - x (script capital h - 210B) - x (black-letter capital h - 210C) - x (double-struck capital h - 210D) -0049 LATIN CAPITAL LETTER I - * Turkish and Azerbaijani use 0131 for lowercase - x (latin capital letter i with dot above - 0130) - x (cyrillic capital letter byelorussian-ukrainian i - 0406) - x (cyrillic letter palochka - 04C0) - x (script capital i - 2110) - x (black-letter capital i - 2111) - x (roman numeral one - 2160) -004A LATIN CAPITAL LETTER J -004B LATIN CAPITAL LETTER K - x (kelvin sign - 212A) -004C LATIN CAPITAL LETTER L - x (script capital l - 2112) -004D LATIN CAPITAL LETTER M - x (script capital m - 2133) -004E LATIN CAPITAL LETTER N - x (double-struck capital n - 2115) -004F LATIN CAPITAL LETTER O -0050 LATIN CAPITAL LETTER P - x (double-struck capital p - 2119) -0051 LATIN CAPITAL LETTER Q - x (double-struck capital q - 211A) -0052 LATIN CAPITAL LETTER R - x (script capital r - 211B) - x (black-letter capital r - 211C) - x (double-struck capital r - 211D) -0053 LATIN CAPITAL LETTER S -0054 LATIN CAPITAL LETTER T -0055 LATIN CAPITAL LETTER U -0056 LATIN CAPITAL LETTER V -0057 LATIN CAPITAL LETTER W -0058 LATIN CAPITAL LETTER X -0059 LATIN CAPITAL LETTER Y -005A LATIN CAPITAL LETTER Z - x (double-struck capital z - 2124) - x (black-letter capital z - 2128) -005B LEFT SQUARE BRACKET - = OPENING SQUARE BRACKET - * other bracket characters: 3008-301B -005C REVERSE SOLIDUS - = BACKSLASH - x (set minus - 2216) -005D RIGHT SQUARE BRACKET - = CLOSING SQUARE BRACKET -005E CIRCUMFLEX ACCENT - * this is a spacing character - x (modifier letter up arrowhead - 02C4) - x (modifier letter circumflex accent - 02C6) - x (combining circumflex accent - 0302) - x (up arrowhead - 2303) -005F LOW LINE - = SPACING UNDERSCORE - * this is a spacing character - x (modifier letter low macron - 02CD) - x (combining macron below - 0331) - x (combining low line - 0332) - x (double low line - 2017) -0060 GRAVE ACCENT - * this is a spacing character - x (modifier letter grave accent - 02CB) - x (combining grave accent - 0300) - x (reversed prime - 2035) -0061 LATIN SMALL LETTER A -0062 LATIN SMALL LETTER B -0063 LATIN SMALL LETTER C -0064 LATIN SMALL LETTER D -0065 LATIN SMALL LETTER E - x (estimated symbol - 212E) - x (script small e - 212F) -0066 LATIN SMALL LETTER F -0067 LATIN SMALL LETTER G - x (latin small letter script g - 0261) - x (script small g - 210A) -0068 LATIN SMALL LETTER H - x (cyrillic small letter shha - 04BB) - x (planck constant - 210E) -0069 LATIN SMALL LETTER I - * Turkish and Azerbaijani use 0130 for uppercase - x (latin small letter dotless i - 0131) -006A LATIN SMALL LETTER J -006B LATIN SMALL LETTER K -006C LATIN SMALL LETTER L - x (script small l - 2113) -006D LATIN SMALL LETTER M -006E LATIN SMALL LETTER N - x (superscript latin small letter n - 207F) -006F LATIN SMALL LETTER O - x (script small o - 2134) -0070 LATIN SMALL LETTER P -0071 LATIN SMALL LETTER Q -0072 LATIN SMALL LETTER R -0073 LATIN SMALL LETTER S -0074 LATIN SMALL LETTER T -0075 LATIN SMALL LETTER U -0076 LATIN SMALL LETTER V -0077 LATIN SMALL LETTER W -0078 LATIN SMALL LETTER X -0079 LATIN SMALL LETTER Y -007A LATIN SMALL LETTER Z - x (latin small letter z with stroke - 01B6) -007B LEFT CURLY BRACKET - = OPENING CURLY BRACKET - = opening brace -007C VERTICAL LINE - = VERTICAL BAR - * used in pairs to indicate absolute value - x (latin letter dental click - 01C0) - x (hebrew punctuation paseq - 05C0) - x (divides - 2223) - x (light vertical bar - 2758) -007D RIGHT CURLY BRACKET - = CLOSING CURLY BRACKET - = closing brace -007E TILDE - * this is a spacing character - x (small tilde - 02DC) - x (combining tilde - 0303) - x (tilde operator - 223C) - x (fullwidth tilde - FF5E) -007F - = DELETE -@@ 0080 C1 Controls and Latin-1 Supplement (Latin-1 Supplement) 00FF -@ C1 controls -@+ Alias names are those for ISO 6429. -0080 -0081 -0082 - = BREAK PERMITTED HERE -0083 - = NO BREAK HERE -0084 -0085 - = NEXT LINE -0086 - = START OF SELECTED AREA -0087 - = END OF SELECTED AREA -0088 - = CHARACTER TABULATION SET -0089 - = CHARACTER TABULATION WITH JUSTIFICATION -008A - = LINE TABULATION SET -008B - = PARTIAL LINE DOWN -008C - = PARTIAL LINE UP -008D - = REVERSE LINE FEED -008E - = SINGLE SHIFT TWO -008F - = SINGLE SHIFT THREE -0090 - = DEVICE CONTROL STRING -0091 - = PRIVATE USE ONE -0092 - = PRIVATE USE TWO -0093 - = SET TRANSMIT STATE -0094 - = CANCEL CHARACTER -0095 - = MESSAGE WAITING -0096 - = START OF GUARDED AREA -0097 - = END OF GUARDED AREA -0098 - = START OF STRING -0099 -009A - = SINGLE CHARACTER INTRODUCER -009B - = CONTROL SEQUENCE INTRODUCER -009C - = STRING TERMINATOR -009D - = OPERATING SYSTEM COMMAND -009E - = PRIVACY MESSAGE -009F - = APPLICATION PROGRAM COMMAND -@ ISO 8859-1 (aka Latin-1) -00A0 NO-BREAK SPACE - x (space - 0020) - x (figure space - 2007) - x (narrow no-break space - 202F) - x (zero width no-break space - FEFF) - # 0020 -00A1 INVERTED EXCLAMATION MARK - * Spanish, Asturian, Galician - x (exclamation mark - 0021) -00A2 CENT SIGN -00A3 POUND SIGN - = pound sterling, Irish punt - x (lira sign - 20A4) -00A4 CURRENCY SIGN - = Filzlaus, Ricardi-Sonne (German names) - * other currency symbol characters: 20A0-20AF - x (dollar sign - 0024) -00A5 YEN SIGN - = yuan sign - * glyph may have one or two crossbars -00A6 BROKEN BAR - = BROKEN VERTICAL BAR - = parted rule (in typography) -00A7 SECTION SIGN - * paragraph sign in some European usage -00A8 DIAERESIS - * this is a spacing character - x (combining diaeresis - 0308) - # 0020 0308 -00A9 COPYRIGHT SIGN - x (sound recording copyright - 2117) -00AA FEMININE ORDINAL INDICATOR - * Spanish - # 0061 -00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK * - = LEFT POINTING GUILLEMET - = chevrons (in typography) - * usually opening, sometimes closing - x (much less-than - 226A) - x (left double angle bracket - 300A) -00AC NOT SIGN - = angled dash (in typography) - x (reversed not sign - 2310) -00AD SOFT HYPHEN - = discretionary hyphen - x (mongolian todo soft hyphen - 1806) -00AE REGISTERED SIGN - = REGISTERED TRADE MARK SIGN -00AF MACRON - = overline, APL overbar - * this is a spacing character - x (modifier letter macron - 02C9) - x (combining macron - 0304) - x (combining overline - 0305) - # 0020 0304 -00B0 DEGREE SIGN - * this is a spacing character - x (ring above - 02DA) - x (combining ring above - 030A) - x (superscript zero - 2070) - x (ring operator - 2218) -00B1 PLUS-MINUS SIGN - x (minus-or-plus sign - 2213) -00B2 SUPERSCRIPT TWO - = squared - * other superscript digit characters: 2070-2079 - x (superscript one - 00B9) - # 0032 -00B3 SUPERSCRIPT THREE - = cubed - x (superscript one - 00B9) - # 0033 -00B4 ACUTE ACCENT - * this is a spacing character - x (modifier letter prime - 02B9) - x (modifier letter acute accent - 02CA) - x (combining acute accent - 0301) - x (prime - 2032) - # 0020 0301 -00B5 MICRO SIGN - # 03BC greek small letter mu -00B6 PILCROW SIGN - = PARAGRAPH SIGN - * section sign in some European usage - x (reversed pilcrow sign - 204B) - x (curved stem paragraph sign ornament - 2761) -00B7 MIDDLE DOT - = midpoint (in typography) - = Georgian comma - = Greek middle dot - x (bullet - 2022) - x (one dot leader - 2024) - x (hyphenation point - 2027) - x (bullet operator - 2219) - x (dot operator - 22C5) - x (katakana middle dot - 30FB) -00B8 CEDILLA - * this is a spacing character - * other spacing accent characters: 02D8-02DB - x (combining cedilla - 0327) - # 0020 0327 -00B9 SUPERSCRIPT ONE - x (superscript two - 00B2) - x (superscript three - 00B3) - # 0031 -00BA MASCULINE ORDINAL INDICATOR - * Spanish - # 006F -00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK * - = RIGHT POINTING GUILLEMET - * usually closing, sometimes opening - x (much greater-than - 226B) - x (right double angle bracket - 300B) -00BC VULGAR FRACTION ONE QUARTER - * bar may be horizontal or slanted - * other fraction characters: 2153-215E - # 0031 2044 0034 -00BD VULGAR FRACTION ONE HALF - * bar may be horizontal or slanted - # 0031 2044 0032 -00BE VULGAR FRACTION THREE QUARTERS - * bar may be horizontal or slanted - # 0033 2044 0034 -00BF INVERTED QUESTION MARK - = turned question mark - * Spanish - x (question mark - 003F) -00C0 LATIN CAPITAL LETTER A WITH GRAVE - : 0041 0300 -00C1 LATIN CAPITAL LETTER A WITH ACUTE - : 0041 0301 -00C2 LATIN CAPITAL LETTER A WITH CIRCUMFLEX - : 0041 0302 -00C3 LATIN CAPITAL LETTER A WITH TILDE - : 0041 0303 -00C4 LATIN CAPITAL LETTER A WITH DIAERESIS - : 0041 0308 -00C5 LATIN CAPITAL LETTER A WITH RING ABOVE - x (angstrom sign - 212B) - : 0041 030A -00C6 LATIN CAPITAL LETTER AE (ash) * - = LATIN CAPITAL LIGATURE AE -00C7 LATIN CAPITAL LETTER C WITH CEDILLA - : 0043 0327 -00C8 LATIN CAPITAL LETTER E WITH GRAVE - : 0045 0300 -00C9 LATIN CAPITAL LETTER E WITH ACUTE - : 0045 0301 -00CA LATIN CAPITAL LETTER E WITH CIRCUMFLEX - : 0045 0302 -00CB LATIN CAPITAL LETTER E WITH DIAERESIS - : 0045 0308 -00CC LATIN CAPITAL LETTER I WITH GRAVE - : 0049 0300 -00CD LATIN CAPITAL LETTER I WITH ACUTE - : 0049 0301 -00CE LATIN CAPITAL LETTER I WITH CIRCUMFLEX - : 0049 0302 -00CF LATIN CAPITAL LETTER I WITH DIAERESIS - : 0049 0308 -00D0 LATIN CAPITAL LETTER ETH (Icelandic) - x (latin small letter eth - 00F0) - x (latin capital letter d with stroke - 0110) - x (latin capital letter african d - 0189) -00D1 LATIN CAPITAL LETTER N WITH TILDE - : 004E 0303 -00D2 LATIN CAPITAL LETTER O WITH GRAVE - : 004F 0300 -00D3 LATIN CAPITAL LETTER O WITH ACUTE - : 004F 0301 -00D4 LATIN CAPITAL LETTER O WITH CIRCUMFLEX - : 004F 0302 -00D5 LATIN CAPITAL LETTER O WITH TILDE - : 004F 0303 -00D6 LATIN CAPITAL LETTER O WITH DIAERESIS - : 004F 0308 -00D7 MULTIPLICATION SIGN - = z notation Cartesian product -00D8 LATIN CAPITAL LETTER O WITH STROKE - = LATIN CAPITAL LETTER O SLASH - x (empty set - 2205) -00D9 LATIN CAPITAL LETTER U WITH GRAVE - : 0055 0300 -00DA LATIN CAPITAL LETTER U WITH ACUTE - : 0055 0301 -00DB LATIN CAPITAL LETTER U WITH CIRCUMFLEX - : 0055 0302 -00DC LATIN CAPITAL LETTER U WITH DIAERESIS - : 0055 0308 -00DD LATIN CAPITAL LETTER Y WITH ACUTE - : 0059 0301 -00DE LATIN CAPITAL LETTER THORN (Icelandic) -00DF LATIN SMALL LETTER SHARP S (German) - = Eszett - * German - * uppercase is "SS" - * in origin a ligature of 017F and 0073 - x (greek small letter beta - 03B2) -00E0 LATIN SMALL LETTER A WITH GRAVE - : 0061 0300 -00E1 LATIN SMALL LETTER A WITH ACUTE - : 0061 0301 -00E2 LATIN SMALL LETTER A WITH CIRCUMFLEX - : 0061 0302 -00E3 LATIN SMALL LETTER A WITH TILDE - * Portuguese - : 0061 0303 -00E4 LATIN SMALL LETTER A WITH DIAERESIS - : 0061 0308 -00E5 LATIN SMALL LETTER A WITH RING ABOVE - * Danish, Norwegian, Swedish, Walloon - : 0061 030A -00E6 LATIN SMALL LETTER AE (ash) * - = LATIN SMALL LIGATURE AE - = ash (from Old English æsc) - * Danish, Norwegian, Icelandic, Faroese, Old English, French, IPA - x (latin small ligature oe - 0153) - x (cyrillic small ligature a ie - 04D5) -00E7 LATIN SMALL LETTER C WITH CEDILLA - : 0063 0327 -00E8 LATIN SMALL LETTER E WITH GRAVE - : 0065 0300 -00E9 LATIN SMALL LETTER E WITH ACUTE - : 0065 0301 -00EA LATIN SMALL LETTER E WITH CIRCUMFLEX - : 0065 0302 -00EB LATIN SMALL LETTER E WITH DIAERESIS - : 0065 0308 -00EC LATIN SMALL LETTER I WITH GRAVE - * Italian, Malagasy - : 0069 0300 -00ED LATIN SMALL LETTER I WITH ACUTE - : 0069 0301 -00EE LATIN SMALL LETTER I WITH CIRCUMFLEX - : 0069 0302 -00EF LATIN SMALL LETTER I WITH DIAERESIS - : 0069 0308 -00F0 LATIN SMALL LETTER ETH (Icelandic) - * Icelandic, Faroese, Old English, IPA - x (latin capital letter eth - 00D0) - x (greek small letter delta - 03B4) - x (partial differential - 2202) -00F1 LATIN SMALL LETTER N WITH TILDE - : 006E 0303 -00F2 LATIN SMALL LETTER O WITH GRAVE - : 006F 0300 -00F3 LATIN SMALL LETTER O WITH ACUTE - : 006F 0301 -00F4 LATIN SMALL LETTER O WITH CIRCUMFLEX - : 006F 0302 -00F5 LATIN SMALL LETTER O WITH TILDE - * Portuguese, Estonian - : 006F 0303 -00F6 LATIN SMALL LETTER O WITH DIAERESIS - : 006F 0308 -00F7 DIVISION SIGN -00F8 LATIN SMALL LETTER O WITH STROKE - = LATIN SMALL LETTER O SLASH - * Danish, Norwegian, Faroese, IPA -00F9 LATIN SMALL LETTER U WITH GRAVE - * French, Italian - : 0075 0300 -00FA LATIN SMALL LETTER U WITH ACUTE - : 0075 0301 -00FB LATIN SMALL LETTER U WITH CIRCUMFLEX - : 0075 0302 -00FC LATIN SMALL LETTER U WITH DIAERESIS - : 0075 0308 -00FD LATIN SMALL LETTER Y WITH ACUTE - * Czech, Slovak, Icelandic, Faroese, Welsh, Malagasy - : 0079 0301 -00FE LATIN SMALL LETTER THORN (Icelandic) - * Icelandic, Old English, phonetics - * Runic letter borrowed into Latin script - x (runic letter thurisaz thurs thorn - 16A6) -00FF LATIN SMALL LETTER Y WITH DIAERESIS - * French - x (latin capital letter y with diaeresis - 0178) - : 0079 0308 -@@ 0100 Latin Extended-A 017F -@ European Latin -0100 LATIN CAPITAL LETTER A WITH MACRON - : 0041 0304 -0101 LATIN SMALL LETTER A WITH MACRON - * Latvian, Latin, ... - : 0061 0304 -0102 LATIN CAPITAL LETTER A WITH BREVE - : 0041 0306 -0103 LATIN SMALL LETTER A WITH BREVE - * Romanian, Vietnamese, Latin, ... - : 0061 0306 -0104 LATIN CAPITAL LETTER A WITH OGONEK - : 0041 0328 -0105 LATIN SMALL LETTER A WITH OGONEK - * Polish, Lithuanian, ... - : 0061 0328 -0106 LATIN CAPITAL LETTER C WITH ACUTE - : 0043 0301 -0107 LATIN SMALL LETTER C WITH ACUTE - * Polish, Croatian, ... - x (cyrillic small letter tshe - 045B) - : 0063 0301 -0108 LATIN CAPITAL LETTER C WITH CIRCUMFLEX - : 0043 0302 -0109 LATIN SMALL LETTER C WITH CIRCUMFLEX - * Esperanto - : 0063 0302 -010A LATIN CAPITAL LETTER C WITH DOT ABOVE - : 0043 0307 -010B LATIN SMALL LETTER C WITH DOT ABOVE - * Maltese, Irish Gaelic (old orthography) - : 0063 0307 -010C LATIN CAPITAL LETTER C WITH CARON - : 0043 030C -010D LATIN SMALL LETTER C WITH CARON - * Czech, Slovak, Slovenian, and many other languages - : 0063 030C -010E LATIN CAPITAL LETTER D WITH CARON - * the form using caron/hacek is preferred in all contexts - : 0044 030C -010F LATIN SMALL LETTER D WITH CARON - * Czech, Slovak - * the form using apostrophe is preferred in typesetting - : 0064 030C -0110 LATIN CAPITAL LETTER D WITH STROKE - x (latin capital letter eth - 00D0) - x (latin small letter d with stroke - 0111) - x (latin capital letter african d - 0189) -0111 LATIN SMALL LETTER D WITH STROKE - * Croatian, Vietnamese, Sámi - x (latin capital letter d with stroke - 0110) - x (cyrillic small letter dje - 0452) -0112 LATIN CAPITAL LETTER E WITH MACRON - : 0045 0304 -0113 LATIN SMALL LETTER E WITH MACRON - * Latvian, Latin, ... - : 0065 0304 -0114 LATIN CAPITAL LETTER E WITH BREVE - : 0045 0306 -0115 LATIN SMALL LETTER E WITH BREVE - * Malay, Latin, ... - : 0065 0306 -0116 LATIN CAPITAL LETTER E WITH DOT ABOVE - : 0045 0307 -0117 LATIN SMALL LETTER E WITH DOT ABOVE - * Lithuanian - : 0065 0307 -0118 LATIN CAPITAL LETTER E WITH OGONEK - : 0045 0328 -0119 LATIN SMALL LETTER E WITH OGONEK - * Polish, Lithuanian, ... - : 0065 0328 -011A LATIN CAPITAL LETTER E WITH CARON - : 0045 030C -011B LATIN SMALL LETTER E WITH CARON - * Czech, ... - : 0065 030C -011C LATIN CAPITAL LETTER G WITH CIRCUMFLEX - : 0047 0302 -011D LATIN SMALL LETTER G WITH CIRCUMFLEX - * Esperanto - : 0067 0302 -011E LATIN CAPITAL LETTER G WITH BREVE - : 0047 0306 -011F LATIN SMALL LETTER G WITH BREVE - * Turkish, Azerbaijani - x (latin small letter g with caron - 01E7) - : 0067 0306 -0120 LATIN CAPITAL LETTER G WITH DOT ABOVE - : 0047 0307 -0121 LATIN SMALL LETTER G WITH DOT ABOVE - * Maltese, Irish Gaelic (old orthography) - : 0067 0307 -0122 LATIN CAPITAL LETTER G WITH CEDILLA - : 0047 0327 -0123 LATIN SMALL LETTER G WITH CEDILLA - * Latvian - * there are three major glyph variants - : 0067 0327 -0124 LATIN CAPITAL LETTER H WITH CIRCUMFLEX - : 0048 0302 -0125 LATIN SMALL LETTER H WITH CIRCUMFLEX - * Esperanto - : 0068 0302 -0126 LATIN CAPITAL LETTER H WITH STROKE -0127 LATIN SMALL LETTER H WITH STROKE - * Maltese, IPA, ... - x (cyrillic small letter tshe - 045B) - x (planck constant over two pi - 210F) -0128 LATIN CAPITAL LETTER I WITH TILDE - : 0049 0303 -0129 LATIN SMALL LETTER I WITH TILDE - * Greenlandic (old orthography) - : 0069 0303 -012A LATIN CAPITAL LETTER I WITH MACRON - : 0049 0304 -012B LATIN SMALL LETTER I WITH MACRON - * Latvian, Latin, ... - : 0069 0304 -012C LATIN CAPITAL LETTER I WITH BREVE - : 0049 0306 -012D LATIN SMALL LETTER I WITH BREVE - * Latin, ... - : 0069 0306 -012E LATIN CAPITAL LETTER I WITH OGONEK - : 0049 0328 -012F LATIN SMALL LETTER I WITH OGONEK - * Lithuanian, ... - : 0069 0328 -0130 LATIN CAPITAL LETTER I WITH DOT ABOVE - = LATIN CAPITAL LETTER I DOT - * Turkish, Azerbaijani - * lowercase is 0069 - x (latin capital letter i - 0049) - : 0049 0307 -0131 LATIN SMALL LETTER DOTLESS I - * Turkish, Azerbaijani - * uppercase is 0049 - x (latin small letter i - 0069) -0132 LATIN CAPITAL LIGATURE IJ - # 0049 004A -0133 LATIN SMALL LIGATURE IJ - * Dutch - # 0069 006A -0134 LATIN CAPITAL LETTER J WITH CIRCUMFLEX - : 004A 0302 -0135 LATIN SMALL LETTER J WITH CIRCUMFLEX - * Esperanto - : 006A 0302 -0136 LATIN CAPITAL LETTER K WITH CEDILLA - : 004B 0327 -0137 LATIN SMALL LETTER K WITH CEDILLA - * Latvian - : 006B 0327 -0138 LATIN SMALL LETTER KRA (Greenlandic) - * Greenlandic (old orthography) -0139 LATIN CAPITAL LETTER L WITH ACUTE - : 004C 0301 -013A LATIN SMALL LETTER L WITH ACUTE - * Slovak - : 006C 0301 -013B LATIN CAPITAL LETTER L WITH CEDILLA - : 004C 0327 -013C LATIN SMALL LETTER L WITH CEDILLA - * Latvian - : 006C 0327 -013D LATIN CAPITAL LETTER L WITH CARON - : 004C 030C -013E LATIN SMALL LETTER L WITH CARON - * Slovak - * the form using apostrophe is preferred in typesetting - : 006C 030C -013F LATIN CAPITAL LETTER L WITH MIDDLE DOT - * some fonts show the middle dot inside the L, but the preferred form has the dot following the L - # 004C 00B7 -0140 LATIN SMALL LETTER L WITH MIDDLE DOT - * Catalan - # 006C 00B7 -0141 LATIN CAPITAL LETTER L WITH STROKE -0142 LATIN SMALL LETTER L WITH STROKE - * Polish, ... - x (latin small letter l with bar - 019A) -0143 LATIN CAPITAL LETTER N WITH ACUTE - : 004E 0301 -0144 LATIN SMALL LETTER N WITH ACUTE - * Polish, ... - : 006E 0301 -0145 LATIN CAPITAL LETTER N WITH CEDILLA - : 004E 0327 -0146 LATIN SMALL LETTER N WITH CEDILLA - * Latvian - : 006E 0327 -0147 LATIN CAPITAL LETTER N WITH CARON - : 004E 030C -0148 LATIN SMALL LETTER N WITH CARON - * Czech, Slovak - : 006E 030C -0149 LATIN SMALL LETTER N PRECEDED BY APOSTROPHE - = LATIN SMALL LETTER APOSTROPHE N - * Afrikaans - * this is not actually a single letter - # 02BC 006E -014A LATIN CAPITAL LETTER ENG (Sami) - * glyph may also have appearance of large form of the small letter -014B LATIN SMALL LETTER ENG (Sami) - * Sámi, Mende, IPA, ... -014C LATIN CAPITAL LETTER O WITH MACRON - : 004F 0304 -014D LATIN SMALL LETTER O WITH MACRON - * Latvian, Latin, ... - : 006F 0304 -014E LATIN CAPITAL LETTER O WITH BREVE - : 004F 0306 -014F LATIN SMALL LETTER O WITH BREVE - * Latin - : 006F 0306 -0150 LATIN CAPITAL LETTER O WITH DOUBLE ACUTE - : 004F 030B -0151 LATIN SMALL LETTER O WITH DOUBLE ACUTE - * Hungarian - : 006F 030B -0152 LATIN CAPITAL LIGATURE OE -0153 LATIN SMALL LIGATURE OE - = LATIN SMALL LETTER O E - = ethel (from Old English eðel) - * French, IPA, Old Icelandic, Old English, ... - x (latin small letter ae - 00E6) - x (latin letter small capital oe - 0276) -0154 LATIN CAPITAL LETTER R WITH ACUTE - : 0052 0301 -0155 LATIN SMALL LETTER R WITH ACUTE - * Slovak, ... - : 0072 0301 -0156 LATIN CAPITAL LETTER R WITH CEDILLA - : 0052 0327 -0157 LATIN SMALL LETTER R WITH CEDILLA - * Latvian - : 0072 0327 -0158 LATIN CAPITAL LETTER R WITH CARON - : 0052 030C -0159 LATIN SMALL LETTER R WITH CARON - * Czech, ... - : 0072 030C -015A LATIN CAPITAL LETTER S WITH ACUTE - : 0053 0301 -015B LATIN SMALL LETTER S WITH ACUTE - * Polish, Indic transliteration, ... - : 0073 0301 -015C LATIN CAPITAL LETTER S WITH CIRCUMFLEX - : 0053 0302 -015D LATIN SMALL LETTER S WITH CIRCUMFLEX - * Esperanto - : 0073 0302 -015E LATIN CAPITAL LETTER S WITH CEDILLA * - : 0053 0327 -015F LATIN SMALL LETTER S WITH CEDILLA * - * Turkish, Azerbaijani, Romanian, ... - * this character is used in both Turkish and Romanian data - * a glyph variant with comma below is preferred for Romanian - x (latin small letter s with comma below - 0219) - : 0073 0327 -0160 LATIN CAPITAL LETTER S WITH CARON - : 0053 030C -0161 LATIN SMALL LETTER S WITH CARON - * Czech, Estonian, Finnish, Slovak, and many other languages - : 0073 030C -0162 LATIN CAPITAL LETTER T WITH CEDILLA * - : 0054 0327 -0163 LATIN SMALL LETTER T WITH CEDILLA * - * Romanian, Semitic transliteration, ... - * this character is used in Romanian data - * a glyph variant with comma below is preferred for Romanian - x (latin small letter t with comma below - 021B) - : 0074 0327 -0164 LATIN CAPITAL LETTER T WITH CARON - * the form using caron/hacek is preferred in all contexts - : 0054 030C -0165 LATIN SMALL LETTER T WITH CARON - * Czech, Slovak - * the form using apostrophe is preferred in typesetting - : 0074 030C -0166 LATIN CAPITAL LETTER T WITH STROKE -0167 LATIN SMALL LETTER T WITH STROKE - * Sámi -0168 LATIN CAPITAL LETTER U WITH TILDE - : 0055 0303 -0169 LATIN SMALL LETTER U WITH TILDE - * Greenlandic (old orthography) - : 0075 0303 -016A LATIN CAPITAL LETTER U WITH MACRON - : 0055 0304 -016B LATIN SMALL LETTER U WITH MACRON - * Latvian, Lithuanian, Latin, ... - : 0075 0304 -016C LATIN CAPITAL LETTER U WITH BREVE - : 0055 0306 -016D LATIN SMALL LETTER U WITH BREVE - * Latin, Esperanto, ... - : 0075 0306 -016E LATIN CAPITAL LETTER U WITH RING ABOVE - : 0055 030A -016F LATIN SMALL LETTER U WITH RING ABOVE - * Czech, ... - : 0075 030A -0170 LATIN CAPITAL LETTER U WITH DOUBLE ACUTE - : 0055 030B -0171 LATIN SMALL LETTER U WITH DOUBLE ACUTE - * Hungarian - : 0075 030B -0172 LATIN CAPITAL LETTER U WITH OGONEK - : 0055 0328 -0173 LATIN SMALL LETTER U WITH OGONEK - * Lithuanian - : 0075 0328 -0174 LATIN CAPITAL LETTER W WITH CIRCUMFLEX - : 0057 0302 -0175 LATIN SMALL LETTER W WITH CIRCUMFLEX - * Welsh - : 0077 0302 -0176 LATIN CAPITAL LETTER Y WITH CIRCUMFLEX - : 0059 0302 -0177 LATIN SMALL LETTER Y WITH CIRCUMFLEX - * Welsh - : 0079 0302 -0178 LATIN CAPITAL LETTER Y WITH DIAERESIS - * French, Igbo - x (latin small letter y with diaeresis - 00FF) - : 0059 0308 -0179 LATIN CAPITAL LETTER Z WITH ACUTE - : 005A 0301 -017A LATIN SMALL LETTER Z WITH ACUTE - * Polish, ... - : 007A 0301 -017B LATIN CAPITAL LETTER Z WITH DOT ABOVE - : 005A 0307 -017C LATIN SMALL LETTER Z WITH DOT ABOVE - * Polish, ... - : 007A 0307 -017D LATIN CAPITAL LETTER Z WITH CARON - : 005A 030C -017E LATIN SMALL LETTER Z WITH CARON - * Czech, Estonian, Finnish, Slovak, Slovenian, and many other languages - : 007A 030C -017F LATIN SMALL LETTER LONG S - * in common use in Roman types until the 18th century - * in current use in Fraktur and Gaelic types - # 0073 latin small letter s -@@ 0180 Latin Extended-B 024F -@ Latin extended-B -0180 LATIN SMALL LETTER B WITH STROKE - * Americanist and Indo-Europeanist usage for phonetic beta - * Old Saxon - x (greek small letter beta - 03B2) - x (blank symbol - 2422) -0181 LATIN CAPITAL LETTER B WITH HOOK - * Zulu, Pan-Nigerian alphabet - x (latin small letter b with hook - 0253) -0182 LATIN CAPITAL LETTER B WITH TOPBAR -0183 LATIN SMALL LETTER B WITH TOPBAR - * Zhuang - * former Soviet minority language scripts - x (cyrillic capital letter be - 0411) -0184 LATIN CAPITAL LETTER TONE SIX -0185 LATIN SMALL LETTER TONE SIX - * Zhuang - * Zhuang tone three is Cyrillic ze - * Zhuang tone four is Cyrillic che - x (latin small letter tone two - 01A8) - x (latin small letter tone five - 01BD) - x (cyrillic small letter ze - 0437) - x (cyrillic small letter che - 0447) - x (cyrillic small letter soft sign - 044C) -0186 LATIN CAPITAL LETTER OPEN O - * typographically a turned C - x (latin small letter open o - 0254) -0187 LATIN CAPITAL LETTER C WITH HOOK -0188 LATIN SMALL LETTER C WITH HOOK - * African -0189 LATIN CAPITAL LETTER AFRICAN D * - * Ewe - x (latin capital letter eth - 00D0) - x (latin capital letter d with stroke - 0110) - x (latin small letter d with tail - 0256) -018A LATIN CAPITAL LETTER D WITH HOOK - * Pan-Nigerian alphabet - x (latin small letter d with hook - 0257) -018B LATIN CAPITAL LETTER D WITH TOPBAR -018C LATIN SMALL LETTER D WITH TOPBAR - * former-Soviet minority language scripts -018D LATIN SMALL LETTER TURNED DELTA - * archaic phonetic for labialized dental fricative - * recommended spellings 007A 02B7 or 007A 032B -018E LATIN CAPITAL LETTER REVERSED E - = LATIN CAPITAL LETTER TURNED E - * Pan-Nigerian alphabet - * lowercase is 01DD -018F LATIN CAPITAL LETTER SCHWA - * Azerbaijani, ... - x (latin small letter schwa - 0259) - x (cyrillic capital letter schwa - 04D8) -0190 LATIN CAPITAL LETTER OPEN E - = LATIN CAPITAL LETTER EPSILON - * African - x (latin small letter open e - 025B) - x (euler constant - 2107) -0191 LATIN CAPITAL LETTER F WITH HOOK - * African -0192 LATIN SMALL LETTER F WITH HOOK - = LATIN SMALL LETTER SCRIPT F - = Florin currency symbol (Netherlands) - = function symbol - = abbreviation convention for folder -0193 LATIN CAPITAL LETTER G WITH HOOK - * African - x (latin small letter g with hook - 0260) -0194 LATIN CAPITAL LETTER GAMMA - * African - x (latin small letter gamma - 0263) -0195 LATIN SMALL LETTER HV (hwair) - * Gothic transliteration - * uppercase is 01F6 -0196 LATIN CAPITAL LETTER IOTA - * African - x (latin small letter iota - 0269) -0197 LATIN CAPITAL LETTER I WITH STROKE - = barred i, i bar - * African - * ISO 6438 gives lowercase as 026A, not 0268 - x (latin letter small capital i - 026A) -0198 LATIN CAPITAL LETTER K WITH HOOK -0199 LATIN SMALL LETTER K WITH HOOK - * Hausa, Pan-Nigerian alphabet -019A LATIN SMALL LETTER L WITH BAR - = barred l - * Americanist phonetic usage for 026C - x (latin small letter l with stroke - 0142) -019B LATIN SMALL LETTER LAMBDA WITH STROKE - = barred lambda, lambda bar - * Americanist phonetic usage -019C LATIN CAPITAL LETTER TURNED M - * Zhuang - x (latin small letter turned m - 026F) -019D LATIN CAPITAL LETTER N WITH LEFT HOOK - * African - x (latin small letter n with left hook - 0272) -019E LATIN SMALL LETTER N WITH LONG RIGHT LEG - * archaic phonetic for Japanese syllabic "n" - * recommended spelling 006E 0329 -019F LATIN CAPITAL LETTER O WITH MIDDLE TILDE * - = barred o, o bar - * lowercase is 0275 - * African - x (cyrillic capital letter barred o - 04E8) -01A0 LATIN CAPITAL LETTER O WITH HORN - : 004F 031B -01A1 LATIN SMALL LETTER O WITH HORN - * Vietnamese - : 006F 031B -01A2 LATIN CAPITAL LETTER OI (gha) -01A3 LATIN SMALL LETTER OI (gha) - = gha - * Pan-Turkic Latin alphabets -01A4 LATIN CAPITAL LETTER P WITH HOOK -01A5 LATIN SMALL LETTER P WITH HOOK - * African -01A6 LATIN LETTER YR * - * old Norse - * from German Standard DIN 31624 and ISO 5246-2 - * lowercase is 0280 -01A7 LATIN CAPITAL LETTER TONE TWO -01A8 LATIN SMALL LETTER TONE TWO - * Zhuang - * typographically a reversed S - x (latin small letter tone six - 0185) -01A9 LATIN CAPITAL LETTER ESH - * African - x (latin small letter esh - 0283) - x (greek capital letter sigma - 03A3) -01AA LATIN LETTER REVERSED ESH LOOP - * archaic phonetic for labialized palatoalveolar or palatal fricative - * Twi - * recommended spellings 0283 02B7, 00E7 02B7, 0068 0265, etc. -01AB LATIN SMALL LETTER T WITH PALATAL HOOK - * archaic phonetic for palatalized alveolar or dental stop - * recommended spelling 0074 02B2 -01AC LATIN CAPITAL LETTER T WITH HOOK -01AD LATIN SMALL LETTER T WITH HOOK - * African -01AE LATIN CAPITAL LETTER T WITH RETROFLEX HOOK - * African - x (latin small letter t with retroflex hook - 0288) -01AF LATIN CAPITAL LETTER U WITH HORN - : 0055 031B -01B0 LATIN SMALL LETTER U WITH HORN - * Vietnamese - : 0075 031B -01B1 LATIN CAPITAL LETTER UPSILON - * African - * typographically based on turned capital Greek omega - x (latin small letter upsilon - 028A) - x (inverted ohm sign - 2127) -01B2 LATIN CAPITAL LETTER V WITH HOOK - = LATIN CAPITAL LETTER SCRIPT V - * African - x (latin small letter v with hook - 028B) -01B3 LATIN CAPITAL LETTER Y WITH HOOK -01B4 LATIN SMALL LETTER Y WITH HOOK - * Bini, Esoko, and other Edo languages in West Africa -01B5 LATIN CAPITAL LETTER Z WITH STROKE -01B6 LATIN SMALL LETTER Z WITH STROKE - = barred z, z bar - * Pan-Turkic Latin orthography - * handwritten variant of Latin "z" - x (latin small letter z - 007A) -01B7 LATIN CAPITAL LETTER EZH - * African, Skolt Sámi - * lowercase is 0292 - x (latin capital letter yogh - 021C) - x (cyrillic capital letter abkhasian dze - 04E0) -01B8 LATIN CAPITAL LETTER EZH REVERSED -01B9 LATIN SMALL LETTER EZH REVERSED - * archaic phonetic for voiced pharyngeal fricative - * sometimes typographically rendered with a turned digit 3 - * recommended spelling 0295 - x (latin letter pharyngeal voiced fricative - 0295) - x (arabic letter ain - 0639) -01BA LATIN SMALL LETTER EZH WITH TAIL - * archaic phonetic for labialized voiced palatoalveolar or palatal fricative - * Twi - * recommended spellings 0292 02B7 or 006A 02B7 -01BB LATIN LETTER TWO WITH STROKE - * archaic phonetic for [dz] affricate - * recommended spellings 0292 or 0064 007A -01BC LATIN CAPITAL LETTER TONE FIVE -01BD LATIN SMALL LETTER TONE FIVE - * Zhuang - x (latin small letter tone six - 0185) -01BE LATIN LETTER INVERTED GLOTTAL STOP WITH STROKE - * archaic phonetic for [ts] affricate - * recommended spelling 0074 0073 - * letter form is actually derived from ligation of ts, rather than inverted glottal stop -01BF LATIN LETTER WYNN - = wen - * Runic letter borrowed into Latin script - * replaced by "w" in modern transcriptions of Old English - * uppercase is 01F7 - x (runic letter wunjo wynn w - 16B9) -01C0 LATIN LETTER DENTAL CLICK - = pipe - * Khoisan tradition - * "c" in Zulu orthography - x (solidus - 002F) - x (vertical line - 007C) - x (latin small letter turned t - 0287) - x (divides - 2223) -01C1 LATIN LETTER LATERAL CLICK - = double pipe - * Khoisan tradition - * "x" in Zulu orthography - x (latin letter inverted glottal stop - 0296) - x (parallel to - 2225) -01C2 LATIN LETTER ALVEOLAR CLICK - = double-barred pipe - * Khoisan tradition - x (not equal to - 2260) -01C3 LATIN LETTER RETROFLEX CLICK - = LATIN LETTER EXCLAMATION MARK - * Khoisan tradition - * "q" in Zulu orthography - x (exclamation mark - 0021) - x (latin letter stretched c - 0297) -@ Croatian digraphs matching Serbian Cyrillic letters -01C4 LATIN CAPITAL LETTER DZ WITH CARON - # 0044 017D -01C5 LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON - # 0044 017E -01C6 LATIN SMALL LETTER DZ WITH CARON - x (cyrillic small letter dzhe - 045F) - # 0064 017E -01C7 LATIN CAPITAL LETTER LJ - # 004C 004A -01C8 LATIN CAPITAL LETTER L WITH SMALL LETTER J - # 004C 006A -01C9 LATIN SMALL LETTER LJ - x (cyrillic small letter lje - 0459) - # 006C 006A -01CA LATIN CAPITAL LETTER NJ - # 004E 004A -01CB LATIN CAPITAL LETTER N WITH SMALL LETTER J - # 004E 006A -01CC LATIN SMALL LETTER NJ - x (cyrillic small letter nje - 045A) - # 006E 006A -@ Pinyin diacritic-vowel combinations -01CD LATIN CAPITAL LETTER A WITH CARON - : 0041 030C -01CE LATIN SMALL LETTER A WITH CARON - * Pinyin third tone - : 0061 030C -01CF LATIN CAPITAL LETTER I WITH CARON - : 0049 030C -01D0 LATIN SMALL LETTER I WITH CARON - * Pinyin third tone - : 0069 030C -01D1 LATIN CAPITAL LETTER O WITH CARON - : 004F 030C -01D2 LATIN SMALL LETTER O WITH CARON - * Pinyin third tone - : 006F 030C -01D3 LATIN CAPITAL LETTER U WITH CARON - : 0055 030C -01D4 LATIN SMALL LETTER U WITH CARON - * Pinyin third tone - : 0075 030C -01D5 LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON - : 00DC 0304 -01D6 LATIN SMALL LETTER U WITH DIAERESIS AND MACRON - * Pinyin first tone - : 00FC 0304 -01D7 LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE - : 00DC 0301 -01D8 LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE - * Pinyin second tone - : 00FC 0301 -01D9 LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON - : 00DC 030C -01DA LATIN SMALL LETTER U WITH DIAERESIS AND CARON - * Pinyin third tone - : 00FC 030C -01DB LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE - : 00DC 0300 -01DC LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE - * Pinyin fourth tone - : 00FC 0300 -@ Additions -01DD LATIN SMALL LETTER TURNED E - * Pan-Nigerian alphabet - * all other usages of schwa are 0259 - * uppercase is 018E - x (latin small letter schwa - 0259) -01DE LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON - : 00C4 0304 -01DF LATIN SMALL LETTER A WITH DIAERESIS AND MACRON - * Livonian, Uralicist usage - : 00E4 0304 -01E0 LATIN CAPITAL LETTER A WITH DOT ABOVE AND MACRON - : 0226 0304 -01E1 LATIN SMALL LETTER A WITH DOT ABOVE AND MACRON - * Uralicist usage - : 0227 0304 -01E2 LATIN CAPITAL LETTER AE WITH MACRON (ash) * - : 00C6 0304 -01E3 LATIN SMALL LETTER AE WITH MACRON (ash) * - * Old Norse, Old English - : 00E6 0304 -01E4 LATIN CAPITAL LETTER G WITH STROKE -01E5 LATIN SMALL LETTER G WITH STROKE - * Skolt Sámi -01E6 LATIN CAPITAL LETTER G WITH CARON - : 0047 030C -01E7 LATIN SMALL LETTER G WITH CARON - * Skolt Sámi - x (latin small letter g with breve - 011F) - : 0067 030C -01E8 LATIN CAPITAL LETTER K WITH CARON - : 004B 030C -01E9 LATIN SMALL LETTER K WITH CARON - * Skolt Sámi - : 006B 030C -01EA LATIN CAPITAL LETTER O WITH OGONEK - : 004F 0328 -01EB LATIN SMALL LETTER O WITH OGONEK - * Sámi, Iroquoian, Old Icelandic - : 006F 0328 -01EC LATIN CAPITAL LETTER O WITH OGONEK AND MACRON - : 01EA 0304 -01ED LATIN SMALL LETTER O WITH OGONEK AND MACRON - * Old Icelandic - : 01EB 0304 -01EE LATIN CAPITAL LETTER EZH WITH CARON - : 01B7 030C -01EF LATIN SMALL LETTER EZH WITH CARON - * Skolt Sámi - : 0292 030C -01F0 LATIN SMALL LETTER J WITH CARON - * IPA and many languages - : 006A 030C -01F1 LATIN CAPITAL LETTER DZ - # 0044 005A -01F2 LATIN CAPITAL LETTER D WITH SMALL LETTER Z - # 0044 007A -01F3 LATIN SMALL LETTER DZ - # 0064 007A -01F4 LATIN CAPITAL LETTER G WITH ACUTE - : 0047 0301 -01F5 LATIN SMALL LETTER G WITH ACUTE - * Macedonian and Serbian transliteration - : 0067 0301 -01F6 LATIN CAPITAL LETTER HWAIR - * lowercase is 0195 -01F7 LATIN CAPITAL LETTER WYNN - = wen - * lowercase is 01BF -01F8 LATIN CAPITAL LETTER N WITH GRAVE - : 004E 0300 -01F9 LATIN SMALL LETTER N WITH GRAVE - * Pinyin - : 006E 0300 -01FA LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE - : 00C5 0301 -01FB LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE - : 00E5 0301 -01FC LATIN CAPITAL LETTER AE WITH ACUTE (ash) * - : 00C6 0301 -01FD LATIN SMALL LETTER AE WITH ACUTE (ash) * - : 00E6 0301 -01FE LATIN CAPITAL LETTER O WITH STROKE AND ACUTE - : 00D8 0301 -01FF LATIN SMALL LETTER O WITH STROKE AND ACUTE - : 00F8 0301 -@ Additions for Slovenian and Croatian -0200 LATIN CAPITAL LETTER A WITH DOUBLE GRAVE - : 0041 030F -0201 LATIN SMALL LETTER A WITH DOUBLE GRAVE - : 0061 030F -0202 LATIN CAPITAL LETTER A WITH INVERTED BREVE - : 0041 0311 -0203 LATIN SMALL LETTER A WITH INVERTED BREVE - : 0061 0311 -0204 LATIN CAPITAL LETTER E WITH DOUBLE GRAVE - : 0045 030F -0205 LATIN SMALL LETTER E WITH DOUBLE GRAVE - : 0065 030F -0206 LATIN CAPITAL LETTER E WITH INVERTED BREVE - : 0045 0311 -0207 LATIN SMALL LETTER E WITH INVERTED BREVE - : 0065 0311 -0208 LATIN CAPITAL LETTER I WITH DOUBLE GRAVE - : 0049 030F -0209 LATIN SMALL LETTER I WITH DOUBLE GRAVE - : 0069 030F -020A LATIN CAPITAL LETTER I WITH INVERTED BREVE - : 0049 0311 -020B LATIN SMALL LETTER I WITH INVERTED BREVE - : 0069 0311 -020C LATIN CAPITAL LETTER O WITH DOUBLE GRAVE - : 004F 030F -020D LATIN SMALL LETTER O WITH DOUBLE GRAVE - : 006F 030F -020E LATIN CAPITAL LETTER O WITH INVERTED BREVE - : 004F 0311 -020F LATIN SMALL LETTER O WITH INVERTED BREVE - : 006F 0311 -0210 LATIN CAPITAL LETTER R WITH DOUBLE GRAVE - : 0052 030F -0211 LATIN SMALL LETTER R WITH DOUBLE GRAVE - : 0072 030F -0212 LATIN CAPITAL LETTER R WITH INVERTED BREVE - : 0052 0311 -0213 LATIN SMALL LETTER R WITH INVERTED BREVE - : 0072 0311 -0214 LATIN CAPITAL LETTER U WITH DOUBLE GRAVE - : 0055 030F -0215 LATIN SMALL LETTER U WITH DOUBLE GRAVE - : 0075 030F -0216 LATIN CAPITAL LETTER U WITH INVERTED BREVE - : 0055 0311 -0217 LATIN SMALL LETTER U WITH INVERTED BREVE - : 0075 0311 -@ Additions for Romanian -0218 LATIN CAPITAL LETTER S WITH COMMA BELOW * - : 0053 0326 -0219 LATIN SMALL LETTER S WITH COMMA BELOW * - * Romanian, when distinct comma below form is required - x (latin small letter s with cedilla - 015F) - : 0073 0326 -021A LATIN CAPITAL LETTER T WITH COMMA BELOW * - : 0054 0326 -021B LATIN SMALL LETTER T WITH COMMA BELOW * - * Romanian, when distinct comma below form is required - x (latin small letter t with cedilla - 0163) - : 0074 0326 -@ Miscellaneous additions -021C LATIN CAPITAL LETTER YOGH - x (latin capital letter ezh - 01B7) -021D LATIN SMALL LETTER YOGH - * Middle English, Scots - x (latin small letter ezh - 0292) - x (ounce sign - 2125) -021E LATIN CAPITAL LETTER H WITH CARON - : 0048 030C -021F LATIN SMALL LETTER H WITH CARON - * Finnish Romany - : 0068 030C -0222 LATIN CAPITAL LETTER OU -0223 LATIN SMALL LETTER OU - * Algonquin, Huron - x (digit eight - 0038) -0224 LATIN CAPITAL LETTER Z WITH HOOK -0225 LATIN SMALL LETTER Z WITH HOOK - * Middle High German -0226 LATIN CAPITAL LETTER A WITH DOT ABOVE - : 0041 0307 -0227 LATIN SMALL LETTER A WITH DOT ABOVE - * Uralicist usage - : 0061 0307 -0228 LATIN CAPITAL LETTER E WITH CEDILLA - : 0045 0327 -0229 LATIN SMALL LETTER E WITH CEDILLA - : 0065 0327 -@ Additions for Livonian -022A LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON - : 00D6 0304 -022B LATIN SMALL LETTER O WITH DIAERESIS AND MACRON - * Livonian - : 00F6 0304 -022C LATIN CAPITAL LETTER O WITH TILDE AND MACRON - : 00D5 0304 -022D LATIN SMALL LETTER O WITH TILDE AND MACRON - * Livonian - : 00F5 0304 -022E LATIN CAPITAL LETTER O WITH DOT ABOVE - : 004F 0307 -022F LATIN SMALL LETTER O WITH DOT ABOVE - * Livonian - : 006F 0307 -0230 LATIN CAPITAL LETTER O WITH DOT ABOVE AND MACRON - : 022E 0304 -0231 LATIN SMALL LETTER O WITH DOT ABOVE AND MACRON - * Livonian - : 022F 0304 -0232 LATIN CAPITAL LETTER Y WITH MACRON - : 0059 0304 -0233 LATIN SMALL LETTER Y WITH MACRON - * Livonian, Cornish - : 0079 0304 -@@ 0250 IPA Extensions 02AF -@ IPA extensions -@+ IPA includes basic Latin letters and a number of Latin letters from other blocks. - x (latin small letter ae - 00E6) - x (latin small letter c with cedilla - 00E7) - x (latin small letter eth - 00F0) - x (latin small letter o with stroke - 00F8) - x (latin small letter h with stroke - 0127) - x (latin small letter eng - 014B) - x (latin small ligature oe - 0153) - x (greek small letter beta - 03B2) - x (greek small letter theta - 03B8) - x (greek small letter lamda - 03BB) - x (greek small letter chi - 03C7) -0250 LATIN SMALL LETTER TURNED A - * low central unrounded vowel -0251 LATIN SMALL LETTER ALPHA - = LATIN SMALL LETTER SCRIPT A - * low back unrounded vowel - x (greek small letter alpha - 03B1) -0252 LATIN SMALL LETTER TURNED ALPHA - * low back rounded vowel -0253 LATIN SMALL LETTER B WITH HOOK - * implosive bilabial stop - * Pan-Nigerian alphabet - x (latin capital letter b with hook - 0181) -0254 LATIN SMALL LETTER OPEN O - * typographically a turned c - * lower-mid back rounded vowel - x (latin capital letter open o - 0186) -0255 LATIN SMALL LETTER C WITH CURL - * voiceless alveolo-palatal laminal fricative - * used in transcription of Mandarin Chinese - * sound spelled with 015B in Polish -0256 LATIN SMALL LETTER D WITH TAIL - = LATIN SMALL LETTER D RETROFLEX HOOK - * voiced retroflex stop - x (latin capital letter african d - 0189) -0257 LATIN SMALL LETTER D WITH HOOK - * implosive dental or alveolar stop - * Ewe, Pan-Nigerian alphabet - x (latin capital letter d with hook - 018A) -0258 LATIN SMALL LETTER REVERSED E - * upper-mid central unrounded vowel -0259 LATIN SMALL LETTER SCHWA - * mid-central unrounded vowel - * variant uppercase form 018E is associated with 01DD - x (latin capital letter schwa - 018F) - x (latin small letter turned e - 01DD) - x (cyrillic small letter schwa - 04D9) -025A LATIN SMALL LETTER SCHWA WITH HOOK - * rhotacized schwa -025B LATIN SMALL LETTER OPEN E - = LATIN SMALL LETTER EPSILON - * lower-mid front unrounded vowel - x (latin capital letter open e - 0190) - x (greek small letter epsilon - 03B5) -025C LATIN SMALL LETTER REVERSED OPEN E - * lower-mid central unrounded vowel -025D LATIN SMALL LETTER REVERSED OPEN E WITH HOOK - * rhotacized lower-mid central vowel -025E LATIN SMALL LETTER CLOSED REVERSED OPEN E - = LATIN SMALL LETTER CLOSED REVERSED EPSILON - * lower-mid central rounded vowel -025F LATIN SMALL LETTER DOTLESS J WITH STROKE - * voiced palatal stop - * typographically a turned f, but better thought of as a form of j - * "gy" in Hungarian orthography - * also archaic phonetic for palatoalveolar affricate 02A4 -0260 LATIN SMALL LETTER G WITH HOOK - * implosive velar stop - x (latin capital letter g with hook - 0193) -0261 LATIN SMALL LETTER SCRIPT G - * voiced velar stop - x (latin small letter g - 0067) -0262 LATIN LETTER SMALL CAPITAL G - * voiced uvular stop -0263 LATIN SMALL LETTER GAMMA - * voiced velar fricative - x (latin capital letter gamma - 0194) - x (greek small letter gamma - 03B3) -0264 LATIN SMALL LETTER RAMS HORN - = LATIN SMALL LETTER BABY GAMMA - * upper-mid back unrounded vowel -0265 LATIN SMALL LETTER TURNED H - * voiced rounded palatal approximant -0266 LATIN SMALL LETTER H WITH HOOK - * breathy-voiced glottal fricative - x (modifier letter small h with hook - 02B1) -0267 LATIN SMALL LETTER HENG WITH HOOK - * voiceless coarticulated velar and palatoalveolar fricative - * "tj" or "kj" or "sj" in some Swedish dialects -0268 LATIN SMALL LETTER I WITH STROKE - = barred i, i bar - * high central unrounded vowel - * ISO 6438 gives lowercase of 0197 as 026A, not 0268 -0269 LATIN SMALL LETTER IOTA - * semi-high front unrounded vowel -@+ * obsoleted by IPA in 1989 - * preferred use is 026A LATIN LETTER SMALL CAPITAL I - x (latin capital letter iota - 0196) - x (greek small letter iota - 03B9) -026A LATIN LETTER SMALL CAPITAL I - * semi-high front unrounded vowel - * preferred IPA alternate for 0269 - x (latin capital letter i with stroke - 0197) -026B LATIN SMALL LETTER L WITH MIDDLE TILDE - * velarized voiced alveolar lateral approximant -026C LATIN SMALL LETTER L WITH BELT - * voiceless alveolar lateral fricative -026D LATIN SMALL LETTER L WITH RETROFLEX HOOK - * voiced retroflex lateral -026E LATIN SMALL LETTER LEZH - * voiced lateral fricative - * "dhl" in Zulu orthography -026F LATIN SMALL LETTER TURNED M - * high back unrounded vowel - x (latin capital letter turned m - 019C) -0270 LATIN SMALL LETTER TURNED M WITH LONG LEG - * voiced velar approximant -0271 LATIN SMALL LETTER M WITH HOOK - * voiced labiodental nasal -0272 LATIN SMALL LETTER N WITH LEFT HOOK - * voiced palatal nasal - x (latin capital letter n with left hook - 019D) -0273 LATIN SMALL LETTER N WITH RETROFLEX HOOK - * voiced retroflex nasal -0274 LATIN LETTER SMALL CAPITAL N - * voiced uvular nasal -0275 LATIN SMALL LETTER BARRED O - = o bar - * rounded mid-central vowel, i.e. rounded schwa - * uppercase is 019F - x (greek small letter theta - 03B8) - x (cyrillic small letter fita - 0473) - x (cyrillic small letter barred o - 04E9) -0276 LATIN LETTER SMALL CAPITAL OE - * low front rounded vowel - x (latin small ligature oe - 0153) -0277 LATIN SMALL LETTER CLOSED OMEGA - * semi-high back rounded vowel -@+ * obsoleted by IPA in 1989 - * preferred use is 028A latin small letter upsilon -0278 LATIN SMALL LETTER PHI - * voiceless bilabial fricative - x (greek small letter phi - 03C6) -0279 LATIN SMALL LETTER TURNED R - * voiced alveolar approximant - x (modifier letter small turned r - 02B4) -027A LATIN SMALL LETTER TURNED R WITH LONG LEG - * voiced lateral flap -027B LATIN SMALL LETTER TURNED R WITH HOOK - * voiced retroflex approximant - x (modifier letter small turned r with hook - 02B5) -027C LATIN SMALL LETTER R WITH LONG LEG - * voiced strident apico-alveolar trill -@+ * obsoleted by IPA in 1989 - * sound spelled with 0159 in Czech - * preferred phonetic representation for Czech is 0072 031D - * in current use in Gaelic types (as glyph variant of 0072) -027D LATIN SMALL LETTER R WITH TAIL - * voiced retroflex flap -027E LATIN SMALL LETTER R WITH FISHHOOK - * voiced alveolar flap or tap -027F LATIN SMALL LETTER REVERSED R WITH FISHHOOK - * apical dental vowel - * used in Sinological tradition - * IPA spelling - 007A 0329 -0280 LATIN LETTER SMALL CAPITAL R * - * voiced uvular trill - * Germanic, Old Norse - * uppercase is 01A6 -0281 LATIN LETTER SMALL CAPITAL INVERTED R - * voiced uvular fricative or approximant - x (modifier letter small capital inverted r - 02B6) -0282 LATIN SMALL LETTER S WITH HOOK - * voiceless retroflex fricative -0283 LATIN SMALL LETTER ESH - * voiceless postalveolar fricative - x (latin capital letter esh - 01A9) - x (integral - 222B) -0284 LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK - * implosive palatal stop - * typographically based on 025F, not on 0283 -0285 LATIN SMALL LETTER SQUAT REVERSED ESH - * apical retroflex vowel - * used in Sinological tradition - * IPA spelling - 0290 0329 -0286 LATIN SMALL LETTER ESH WITH CURL - * palatalized voiceless postalveolar fricative - * suggested spelling - 0283 02B2 -0287 LATIN SMALL LETTER TURNED T - * dental click (sound of "tsk tsk") - x (latin letter dental click - 01C0) -0288 LATIN SMALL LETTER T WITH RETROFLEX HOOK - * voiceless retroflex stop - x (latin capital letter t with retroflex hook - 01AE) -0289 LATIN SMALL LETTER U BAR - * high central rounded vowel -028A LATIN SMALL LETTER UPSILON - * semi-high back rounded vowel - * preferred IPA alternate to 0277 - x (latin capital letter upsilon - 01B1) - x (greek small letter upsilon - 03C5) -028B LATIN SMALL LETTER V WITH HOOK - = LATIN SMALL LETTER SCRIPT V - * voiced labiodental approximant - x (latin capital letter v with hook - 01B2) - x (greek small letter upsilon - 03C5) -028C LATIN SMALL LETTER TURNED V - = caret, wedge - * lower-mid back unrounded vowel - x (greek capital letter lamda - 039B) - x (caret - 2038) - x (logical and - 2227) -028D LATIN SMALL LETTER TURNED W - * voiceless rounded labiovelar approximant -028E LATIN SMALL LETTER TURNED Y - * voiced lateral approximant -028F LATIN LETTER SMALL CAPITAL Y - * semi-high front rounded vowel -0290 LATIN SMALL LETTER Z WITH RETROFLEX HOOK - * voiced retroflex fricative -0291 LATIN SMALL LETTER Z WITH CURL - * voiced alveolo-palatal laminal fricative - * sound spelled with 017A in Polish -0292 LATIN SMALL LETTER EZH - = LATIN SMALL LETTER YOGH - = dram - * voiced postalveolar fricative - * uppercase is 01B7 - * Skolt Sámi - x (latin small letter yogh - 021D) - x (cyrillic small letter abkhasian dze - 04E1) - x (ounce sign - 2125) -0293 LATIN SMALL LETTER EZH WITH CURL - * palatalized voiced postalveolar fricative -0294 LATIN LETTER GLOTTAL STOP - x (modifier letter glottal stop - 02C0) -0295 LATIN LETTER PHARYNGEAL VOICED FRICATIVE - = LATIN LETTER REVERSED GLOTTAL STOP - * voiced pharyngeal fricative - * ain - x (latin small letter ezh reversed - 01B9) - x (modifier letter reversed glottal stop - 02C1) -0296 LATIN LETTER INVERTED GLOTTAL STOP - * lateral click - x (latin letter lateral click - 01C1) -0297 LATIN LETTER STRETCHED C - * palatal (or alveolar) click - x (latin letter retroflex click - 01C3) - x (complement - 2201) -0298 LATIN LETTER BILABIAL CLICK - = LATIN LETTER BULLSEYE - x (circled dot operator - 2299) -0299 LATIN LETTER SMALL CAPITAL B - * bilabial trill -029A LATIN SMALL LETTER CLOSED OPEN E - = LATIN SMALL LETTER CLOSED EPSILON - * lower-mid front rounded vowel - * non-IPA alternate for the preferred 0153 -029B LATIN LETTER SMALL CAPITAL G WITH HOOK - * voiced uvular implosive -029C LATIN LETTER SMALL CAPITAL H - * voiceless epiglottal fricative -029D LATIN SMALL LETTER J WITH CROSSED-TAIL - * voiced palatal fricative -029E LATIN SMALL LETTER TURNED K - * proposed for velar click -@+ * withdrawn by IPA in 1970 -029F LATIN LETTER SMALL CAPITAL L - * velar lateral approximant -02A0 LATIN SMALL LETTER Q WITH HOOK - * voiceless uvular implosive -02A1 LATIN LETTER GLOTTAL STOP WITH STROKE - * voiced epiglottal stop -02A2 LATIN LETTER REVERSED GLOTTAL STOP WITH STROKE - * voiced epiglottal fricative -02A3 LATIN SMALL LETTER DZ DIGRAPH - * voiced dental affricate -02A4 LATIN SMALL LETTER DEZH DIGRAPH - * voiced postalveolar affricate -02A5 LATIN SMALL LETTER DZ DIGRAPH WITH CURL - * voiced alveolo-palatal affricate -02A6 LATIN SMALL LETTER TS DIGRAPH - * voiceless dental affricate -02A7 LATIN SMALL LETTER TESH DIGRAPH - * voiceless postalveolar affricate -02A8 LATIN SMALL LETTER TC DIGRAPH WITH CURL - * voiceless alveolo-palatal affricate -@ IPA characters for disordered speech -02A9 LATIN SMALL LETTER FENG DIGRAPH - * velopharyngeal fricative -02AA LATIN SMALL LETTER LS DIGRAPH - * lateral alveolar fricative (lisp) -02AB LATIN SMALL LETTER LZ DIGRAPH - * voiced lateral alveolar fricative -02AC LATIN LETTER BILABIAL PERCUSSIVE - * audible lip smack -02AD LATIN LETTER BIDENTAL PERCUSSIVE - * audible teeth gnashing -@@ 02B0 Spacing Modifier Letters 02FF -@ Phonetic modifiers derived from Latin letters -02B0 MODIFIER LETTER SMALL H - * aspiration - # 0068 -02B1 MODIFIER LETTER SMALL H WITH HOOK - * breathy voiced, murmured - x (latin small letter h with hook - 0266) - x (combining diaeresis below - 0324) - # 0266 -02B2 MODIFIER LETTER SMALL J - * palatalization - x (combining palatalized hook below - 0321) - # 006A -02B3 MODIFIER LETTER SMALL R - # 0072 -02B4 MODIFIER LETTER SMALL TURNED R - x (latin small letter turned r - 0279) - # 0279 -02B5 MODIFIER LETTER SMALL TURNED R WITH HOOK - x (latin small letter turned r with hook - 027B) - # 027B -02B6 MODIFIER LETTER SMALL CAPITAL INVERTED R - * preceding four used for r-coloring or r-offglides - x (latin letter small capital inverted r - 0281) - # 0281 -02B7 MODIFIER LETTER SMALL W - * labialization - x (combining inverted double arch below - 032B) - # 0077 -02B8 MODIFIER LETTER SMALL Y - * palatalization - * common Americanist substitution for 02B2 - # 0079 -@ Miscellaneous phonetic modifiers -02B9 MODIFIER LETTER PRIME - * primary stress, emphasis - * transliteration of mjagkij znak (Cyrillic soft sign: palatalization) - x (apostrophe - 0027) - x (acute accent - 00B4) - x (modifier letter acute accent - 02CA) - x (combining acute accent - 0301) - x (greek numeral sign - 0374) - x (prime - 2032) -02BA MODIFIER LETTER DOUBLE PRIME - * exaggerated stress, contrastive stress - * transliteration of tverdyj znak (Cyrillic hard sign: no palatalization) - x (quotation mark - 0022) - x (combining double acute accent - 030B) - x (double prime - 2033) -02BB MODIFIER LETTER TURNED COMMA - * typographical alternate for 02BD or 02BF - x (combining turned comma above - 0312) - x (left single quotation mark - 2018) -02BC MODIFIER LETTER APOSTROPHE - = apostrophe - * glottal stop, glottalization, ejective - * spacing clone of Greek smooth breathing mark - * many languages use this as a letter of their alphabets - x (apostrophe - 0027) - x (combining comma above - 0313) - x (combining comma above right - 0315) - x (armenian apostrophe - 055A) - x (right single quotation mark - 2019) -02BD MODIFIER LETTER REVERSED COMMA - * weak aspiration - * spacing clone of Greek rough breathing mark - x (combining reversed comma above - 0314) - x (armenian modifier letter left half ring - 0559) - x (single high-reversed-9 quotation mark - 201B) -02BE MODIFIER LETTER RIGHT HALF RING - * transliteration of Arabic hamza (glottal stop) - x (armenian apostrophe - 055A) - x (arabic letter hamza - 0621) -02BF MODIFIER LETTER LEFT HALF RING - * transliteration of Arabic ain (voiced pharyngeal fricative) - x (armenian modifier letter left half ring - 0559) - x (arabic letter ain - 0639) -02C0 MODIFIER LETTER GLOTTAL STOP - * ejective or glottalized - * typographical alternate for 02BC or 02BE - x (latin letter glottal stop - 0294) - x (combining hook above - 0309) -02C1 MODIFIER LETTER REVERSED GLOTTAL STOP - * typographical alternate for 02BF - x (latin letter pharyngeal voiced fricative - 0295) -02C2 MODIFIER LETTER LEFT ARROWHEAD - * fronted articulation -02C3 MODIFIER LETTER RIGHT ARROWHEAD - * backed articulation -02C4 MODIFIER LETTER UP ARROWHEAD - * raised articulation - x (circumflex accent - 005E) - x (up arrowhead - 2303) -02C5 MODIFIER LETTER DOWN ARROWHEAD - * lowered articulation -02C6 MODIFIER LETTER CIRCUMFLEX ACCENT - * rising-falling tone, falling tone, secondary stress, etc. - x (circumflex accent - 005E) - x (combining circumflex accent - 0302) -02C7 CARON (Mandarin Chinese third tone) - = hacek - * falling-rising tone - * Mandarin Chinese third tone - x (combining caron - 030C) -02C8 MODIFIER LETTER VERTICAL LINE - * primary stress, downstep - * precedes letter or syllable modified - x (apostrophe - 0027) - x (combining vertical line above - 030D) -02C9 MODIFIER LETTER MACRON (Mandarin Chinese first tone) - * high level tone - * precedes or follows letter or syllable modified - * Mandarin Chinese first tone - x (macron - 00AF) - x (combining macron - 0304) -02CA MODIFIER LETTER ACUTE ACCENT (Mandarin Chinese second tone) - * high-rising tone (IPA), high tone, primary stress - * Mandarin Chinese second tone - x (acute accent - 00B4) - x (modifier letter prime - 02B9) - x (combining acute accent - 0301) - x (greek numeral sign - 0374) - x (armenian emphasis mark - 055B) -02CB MODIFIER LETTER GRAVE ACCENT (Mandarin Chinese fourth tone) - * high-falling tone (IPA), low tone, secondary or tertiary stress - * Mandarin Chinese fourth tone - x (grave accent - 0060) - x (combining grave accent - 0300) - x (armenian comma - 055D) -02CC MODIFIER LETTER LOW VERTICAL LINE - * secondary stress - * precedes letter or syllable modified - x (combining vertical line below - 0329) -02CD MODIFIER LETTER LOW MACRON - * low level tone - x (low line - 005F) - x (combining macron below - 0331) -02CE MODIFIER LETTER LOW GRAVE ACCENT - * low-falling tone -02CF MODIFIER LETTER LOW ACUTE ACCENT - * low-rising tone - x (greek lower numeral sign - 0375) -02D0 MODIFIER LETTER TRIANGULAR COLON - * length mark - x (colon - 003A) -02D1 MODIFIER LETTER HALF TRIANGULAR COLON - * half-length mark - x (middle dot - 00B7) -02D2 MODIFIER LETTER CENTRED RIGHT HALF RING - * more rounded articulation -02D3 MODIFIER LETTER CENTRED LEFT HALF RING - * less rounded articulation -02D4 MODIFIER LETTER UP TACK - * vowel raising or closing - x (combining up tack below - 031D) - x (combining dot below - 0323) -02D5 MODIFIER LETTER DOWN TACK - * vowel lowering or opening - x (combining left half ring below - 031C) - x (combining down tack below - 031E) -02D6 MODIFIER LETTER PLUS SIGN - * advanced or fronted articulation - x (combining plus sign below - 031F) -02D7 MODIFIER LETTER MINUS SIGN - * retracted or backed articulation - * glyph may have small end-serifs - x (combining minus sign below - 0320) -@ Spacing clones of diacritics -02D8 BREVE - x (combining breve - 0306) - # 0020 0306 -02D9 DOT ABOVE (Mandarin Chinese light tone) - * Mandarin Chinese fifth tone (light or neutral) - x (combining dot above - 0307) - # 0020 0307 -02DA RING ABOVE - x (degree sign - 00B0) - x (combining ring above - 030A) - # 0020 030A -02DB OGONEK - x (combining ogonek - 0328) - # 0020 0328 -02DC SMALL TILDE - x (tilde - 007E) - x (combining tilde - 0303) - x (tilde operator - 223C) - # 0020 0303 -02DD DOUBLE ACUTE ACCENT - x (combining double acute accent - 030B) - # 0020 030B -@ Additions based on 1989 IPA -02DE MODIFIER LETTER RHOTIC HOOK - * rhotacization in vowel - * often ligated: 025A = 0259 + 02DE; 025D = 025C + 02DE -02DF MODIFIER LETTER CROSS ACCENT - * Swedish grave accent -02E0 MODIFIER LETTER SMALL GAMMA - * these modifier letters are occasionally used in transcription of affricates - # 0263 -02E1 MODIFIER LETTER SMALL L - # 006C -02E2 MODIFIER LETTER SMALL S - # 0073 -02E3 MODIFIER LETTER SMALL X - # 0078 -02E4 MODIFIER LETTER SMALL REVERSED GLOTTAL STOP - # 0295 -@ Tone letters -02E5 MODIFIER LETTER EXTRA-HIGH TONE BAR -02E6 MODIFIER LETTER HIGH TONE BAR -02E7 MODIFIER LETTER MID TONE BAR -02E8 MODIFIER LETTER LOW TONE BAR -02E9 MODIFIER LETTER EXTRA-LOW TONE BAR -02EA MODIFIER LETTER YIN DEPARTING TONE MARK -02EB MODIFIER LETTER YANG DEPARTING TONE MARK -@ IPA modifiers -02EC MODIFIER LETTER VOICING -02ED MODIFIER LETTER UNASPIRATED -@ Other modifier letters -02EE MODIFIER LETTER DOUBLE APOSTROPHE - -2000 EN QUAD - : 2002 en space -2001 EM QUAD - = mutton quad - : 2003 em space -2002 EN SPACE - = nut - * half an em - # 0020 space -2003 EM SPACE - = mutton - * nominally, a space equal to the type size in points - * may scale by the condensation factor of a font - # 0020 space -2004 THREE-PER-EM SPACE - = thick space - # 0020 space -2005 FOUR-PER-EM SPACE - = mid space - # 0020 space -2006 SIX-PER-EM SPACE - * in computer typography sometimes equated to thin space - # 0020 space -2007 FIGURE SPACE - * space equal to tabular width of a font - * this is equivalent to the digit width of fonts with fixed-width digits - # 0020 -2008 PUNCTUATION SPACE - * space equal to narrow punctuation of a font - # 0020 space -2009 THIN SPACE - * a fifth of an em (or sometimes a sixth) - # 0020 space -200A HAIR SPACE - * thinner than a thin space - * in traditional typography, the thinnest space available - # 0020 space -200B ZERO WIDTH SPACE - * nominally zero width, but may expand in justification -@ Formatting characters -200C ZERO WIDTH NON-JOINER - = ZWNJ -200D ZERO WIDTH JOINER - = ZWJ -200E LEFT-TO-RIGHT MARK - = LRM -200F RIGHT-TO-LEFT MARK - = RLM -@ Dashes -2010 HYPHEN - x (hyphen-minus - 002D) -2011 NON-BREAKING HYPHEN - x (hyphen-minus - 002D) - # 2010 -2012 FIGURE DASH -2013 EN DASH -2014 EM DASH - * may be used in pairs to offset parenthetical text - x (katakana-hiragana prolonged sound mark - 30FC) -2015 HORIZONTAL BAR - = QUOTATION DASH - * long dash introducing quoted text -@ General punctuation -2016 DOUBLE VERTICAL LINE - * used in pairs to indicate norm of a matrix - x (parallel to - 2225) -2017 DOUBLE LOW LINE - * this is a spacing character - x (low line - 005F) - x (combining double low line - 0333) - # 0020 0333 -2018 LEFT SINGLE QUOTATION MARK - = SINGLE TURNED COMMA QUOTATION MARK - * this is the preferred glyph (as opposed to 201B) - x (apostrophe - 0027) - x (modifier letter turned comma - 02BB) - x (heavy single turned comma quotation mark ornament - 275B) -2019 RIGHT SINGLE QUOTATION MARK - = SINGLE COMMA QUOTATION MARK - * this is the preferred character to use for apostrophe - x (apostrophe - 0027) - x (modifier letter apostrophe - 02BC) - x (heavy single comma quotation mark ornament - 275C) -201A SINGLE LOW-9 QUOTATION MARK - = LOW SINGLE COMMA QUOTATION MARK - * used as opening single quotation mark in some languages -201B SINGLE HIGH-REVERSED-9 QUOTATION MARK - = SINGLE REVERSED COMMA QUOTATION MARK - * glyph variant of 2018 - x (modifier letter reversed comma - 02BD) -201C LEFT DOUBLE QUOTATION MARK - = DOUBLE TURNED COMMA QUOTATION MARK - * this is the preferred glyph (as opposed to 201F) - x (quotation mark - 0022) - x (heavy double turned comma quotation mark ornament - 275D) - x (reversed double prime quotation mark - 301D) -201D RIGHT DOUBLE QUOTATION MARK - = DOUBLE COMMA QUOTATION MARK - x (quotation mark - 0022) - x (double prime - 2033) - x (heavy double comma quotation mark ornament - 275E) - x (double prime quotation mark - 301E) -201E DOUBLE LOW-9 QUOTATION MARK - = LOW DOUBLE COMMA QUOTATION MARK - * used as opening double quotation mark in some languages - x (low double prime quotation mark - 301F) -201F DOUBLE HIGH-REVERSED-9 QUOTATION MARK - = DOUBLE REVERSED COMMA QUOTATION MARK - * glyph variant of 201C -2020 DAGGER - = obelisk, obelus, long cross -2021 DOUBLE DAGGER - = diesis, double obelisk -2022 BULLET - = black small circle - x (middle dot - 00B7) - x (one dot leader - 2024) - x (bullet operator - 2219) - x (inverse bullet - 25D8) - x (white bullet - 25E6) -2023 TRIANGULAR BULLET - x (end of proof - 220E) - x (black right-pointing small triangle - 25B8) -2024 ONE DOT LEADER - x (middle dot - 00B7) - x (bullet - 2022) - x (bullet operator - 2219) - # 002E full stop -2025 TWO DOT LEADER - # 002E 002E -2026 HORIZONTAL ELLIPSIS - = three dot leader - x (vertical ellipsis - 22EE) - # 002E 002E 002E -2027 HYPHENATION POINT -@ Formatting characters -2028 LINE SEPARATOR - * may be used to represent this semantic unambiguously -2029 PARAGRAPH SEPARATOR - * may be used to represent this semantic unambiguously -202A LEFT-TO-RIGHT EMBEDDING - = LRE -202B RIGHT-TO-LEFT EMBEDDING - = RLE -202C POP DIRECTIONAL FORMATTING - = PDF -202D LEFT-TO-RIGHT OVERRIDE - = LRO -202E RIGHT-TO-LEFT OVERRIDE - = RLO -202F NARROW NO-BREAK SPACE - x (no-break space - 00A0) - # 0020 -@ General punctuation -2030 PER MILLE SIGN - x (percent sign - 0025) -2031 PER TEN THOUSAND SIGN - x (percent sign - 0025) -2032 PRIME - = minutes, feet - x (apostrophe - 0027) - x (acute accent - 00B4) - x (modifier letter prime - 02B9) -2033 DOUBLE PRIME - = seconds, inches - x (quotation mark - 0022) - x (modifier letter double prime - 02BA) - x (right double quotation mark - 201D) - x (ditto mark - 3003) - x (double prime quotation mark - 301E) - # 2032 2032 -2034 TRIPLE PRIME - # 2032 2032 2032 -2035 REVERSED PRIME - x (grave accent - 0060) -2036 REVERSED DOUBLE PRIME - x (reversed double prime quotation mark - 301D) - # 2035 2035 -2037 REVERSED TRIPLE PRIME - # 2035 2035 2035 -2038 CARET - x (up arrowhead - 2303) -2039 SINGLE LEFT-POINTING ANGLE QUOTATION MARK - = LEFT POINTING SINGLE GUILLEMET - * usually opening, sometimes closing - x (less-than sign - 003C) - x (left-pointing angle bracket - 2329) - x (left angle bracket - 3008) -203A SINGLE RIGHT-POINTING ANGLE QUOTATION MARK - = RIGHT POINTING SINGLE GUILLEMET - * usually closing, sometimes opening - x (greater-than sign - 003E) - x (right-pointing angle bracket - 232A) - x (right angle bracket - 3009) -203B REFERENCE MARK - = Japanese kome - = Urdu paragraph separator - x (tibetan ku ru kha bzhi mig can - 0FBF) -203C DOUBLE EXCLAMATION MARK - x (exclamation mark - 0021) - # 0021 0021 -203D INTERROBANG - x (exclamation mark - 0021) - x (question mark - 003F) -203E OVERLINE - = SPACING OVERSCORE - # 0020 0305 -203F UNDERTIE (Enotikon) - = Greek enotikon - x (smile - 2323) -2040 CHARACTER TIE - x (frown - 2322) -2041 CARET INSERTION POINT - * proofreader's mark: insert here - x (right semidirect product - 22CC) -2042 ASTERISM -2043 HYPHEN BULLET -2044 FRACTION SLASH - = solidus (in typography) - * for composing arbitrary fractions - x (solidus - 002F) - x (division slash - 2215) -2045 LEFT SQUARE BRACKET WITH QUILL -2046 RIGHT SQUARE BRACKET WITH QUILL -2048 QUESTION EXCLAMATION MARK - * designed for use in vertical text - # 003F 0021 -2049 EXCLAMATION QUESTION MARK - * designed for use in vertical text - # 0021 003F -204A TIRONIAN SIGN ET - * Irish Gaelic, ... -204B REVERSED PILCROW SIGN - x (pilcrow sign - 00B6) -204C BLACK LEFTWARDS BULLET -204D BLACK RIGHTWARDS BULLET -@ Deprecated -206A INHIBIT SYMMETRIC SWAPPING -206B ACTIVATE SYMMETRIC SWAPPING -206C INHIBIT ARABIC FORM SHAPING -206D ACTIVATE ARABIC FORM SHAPING -206E NATIONAL DIGIT SHAPES -206F NOMINAL DIGIT SHAPES -@@ 2070 Superscripts and Subscripts 209F -@ Superscripts -2070 SUPERSCRIPT ZERO - # 0030 -2071 - x (superscript one - 00B9) -2072 - x (superscript two - 00B2) -2073 - x (superscript three - 00B3) -2074 SUPERSCRIPT FOUR - # 0034 -2075 SUPERSCRIPT FIVE - # 0035 -2076 SUPERSCRIPT SIX - # 0036 -2077 SUPERSCRIPT SEVEN - # 0037 -2078 SUPERSCRIPT EIGHT - # 0038 -2079 SUPERSCRIPT NINE - # 0039 -207A SUPERSCRIPT PLUS SIGN - # 002B -207B SUPERSCRIPT MINUS - # 2212 -207C SUPERSCRIPT EQUALS SIGN - # 003D -207D SUPERSCRIPT LEFT PARENTHESIS - # 0028 -207E SUPERSCRIPT RIGHT PARENTHESIS - # 0029 -207F SUPERSCRIPT LATIN SMALL LETTER N - # 006E -@ Subscripts -2080 SUBSCRIPT ZERO - # 0030 -2081 SUBSCRIPT ONE - # 0031 -2082 SUBSCRIPT TWO - # 0032 -2083 SUBSCRIPT THREE - # 0033 -2084 SUBSCRIPT FOUR - # 0034 -2085 SUBSCRIPT FIVE - # 0035 -2086 SUBSCRIPT SIX - # 0036 -2087 SUBSCRIPT SEVEN - # 0037 -2088 SUBSCRIPT EIGHT - # 0038 -2089 SUBSCRIPT NINE - # 0039 -208A SUBSCRIPT PLUS SIGN - # 002B -208B SUBSCRIPT MINUS - # 2212 -208C SUBSCRIPT EQUALS SIGN - # 003D -208D SUBSCRIPT LEFT PARENTHESIS - # 0028 -208E SUBSCRIPT RIGHT PARENTHESIS - # 0029 -@@ 20A0 Currency Symbols 20CF -@ Currency symbols -@+ A number of currency symbols are found in other blocks. - x (dollar sign - 0024) - x (cent sign - 00A2) - x (pound sign - 00A3) - x (currency sign - 00A4) - x (yen sign - 00A5) - x (bengali rupee mark - 09F2) - x (bengali rupee sign - 09F3) - x (thai currency symbol baht - 0E3F) - x (khmer currency symbol riel - 17DB) -20A0 EURO-CURRENCY SIGN - * intended for ECU, but not widely used - * historical character, this is NOT the euro! - x (euro sign - 20AC) -20A1 COLON SIGN - * Costa Rica, El Salvador -20A2 CRUZEIRO SIGN - * Brazil -20A3 FRENCH FRANC SIGN - * France -20A4 LIRA SIGN - * Italy, Turkey - x (pound sign - 00A3) -20A5 MILL SIGN - * USA (1/10 cent) -20A6 NAIRA SIGN - * Nigeria -20A7 PESETA SIGN - * Spain -20A8 RUPEE SIGN - * India - # 0052 0073 -20A9 WON SIGN - * Korea -20AA NEW SHEQEL SIGN - * Israel -20AB DONG SIGN - * Vietnam -20AC EURO SIGN - * currency sign for the European Monetary Union - * euro, not ECU - x (euro-currency sign - 20A0) -20AD KIP SIGN - * Laos -20AE TUGRIK SIGN - * Mongolia - * also transliterated as tugrug, tugric, tugrog, togrog -20AF DRACHMA SIGN - * Greece -@@ 20D0 Combining Diacritical Marks for Symbols 20FF -@ Combining diacritical marks for symbols -20D0 COMBINING LEFT HARPOON ABOVE -20D1 COMBINING RIGHT HARPOON ABOVE - * vector -20D2 COMBINING LONG VERTICAL LINE OVERLAY -20D3 COMBINING SHORT VERTICAL LINE OVERLAY - * negation -20D4 COMBINING ANTICLOCKWISE ARROW ABOVE -20D5 COMBINING CLOCKWISE ARROW ABOVE - * rotation -20D6 COMBINING LEFT ARROW ABOVE -20D7 COMBINING RIGHT ARROW ABOVE - * vector -20D8 COMBINING RING OVERLAY -20D9 COMBINING CLOCKWISE RING OVERLAY -20DA COMBINING ANTICLOCKWISE RING OVERLAY -20DB COMBINING THREE DOTS ABOVE - = third derivative -20DC COMBINING FOUR DOTS ABOVE - = fourth derivative -@ Enclosing diacritics -20DD COMBINING ENCLOSING CIRCLE - = JIS composition circle - x (white circle - 25CB) - x (large circle - 25EF) - x (ideographic number zero - 3007) -20DE COMBINING ENCLOSING SQUARE - x (white square - 25A1) -20DF COMBINING ENCLOSING DIAMOND - x (white diamond - 25C7) -20E0 COMBINING ENCLOSING CIRCLE BACKSLASH - * prohibition -@ Additional diacritical mark for symbols -20E1 COMBINING LEFT RIGHT ARROW ABOVE - * tensor -@ Additional enclosing diacritics -20E2 COMBINING ENCLOSING SCREEN - x (clear screen symbol - 239A) -20E3 COMBINING ENCLOSING KEYCAP - -*/ - +// +// CHARNAMES.CPP +// +// A header file that links Unicode character names to character numbers. +// by James L. Hammons +// (C) 2004 Underground Software +// +// JLH = James L. Hammons +// +// Who When What +// --- ---------- ------------------------------------------------------------- +// JLH ??/??/200? Created this file +// + +unsigned char macStdNames[] = { + "\x06""notdef" + "\x05"".null" + "\x02""CR" + "\x05""space" + "\x06""exclam" + "\x08""quotedbl" + "\x0A""numbersign" + "\x06""dollar" + "\x07""percent" + "\x09""ampersand" + "\x0B""quotesingle" + "\x09""parenleft" + "\x0A""parenright" + "\x08""asterisk" + "\x04""plus" + "\x05""comma" + "\x06""hyphen" + "\x06""period" + "\x05""slash" + "\x04""zero" + "\x03""one" + "\x03""two" + "\x05""three" + "\x04""four" + "\x04""five" + "\x03""six" + "\x05""seven" + "\x05""eight" + "\x04""nine" + "\x05""colon" + "\x09""semicolon" + "\x04""less" + "\x05""equal" + "\x07""greater" + "\x08""question" + "\x02""at" + "\x01""A" + "\x01""B" + "\x01""C" + "\x01""D" + "\x01""E" + "\x01""F" + "\x01""G" + "\x01""H" + "\x01""I" + "\x01""J" + "\x01""K" + "\x01""L" + "\x01""M" + "\x01""N" + "\x01""O" + "\x01""P" + "\x01""Q" + "\x01""R" + "\x01""S" + "\x01""T" + "\x01""U" + "\x01""V" + "\x01""W" + "\x01""X" + "\x01""Y" + "\x01""Z" + "\x0B""bracketleft" + "\x09""backslash" + "\x0C""bracketright" + "\x0B""asciicircum" + "\x0A""underscore" + "\x05""grave" + "\x01""a" + "\x01""b" + "\x01""c" + "\x01""d" + "\x01""e" + "\x01""f" + "\x01""g" + "\x01""h" + "\x01""i" + "\x01""j" + "\x01""k" + "\x01""l" + "\x01""m" + "\x01""n" + "\x01""o" + "\x01""p" + "\x01""q" + "\x01""r" + "\x01""s" + "\x01""t" + "\x01""u" + "\x01""v" + "\x01""w" + "\x01""x" + "\x01""y" + "\x01""z" + "\x09""braceleft" + "\x03""bar" + "\x0A""braceright" + "\x0A""asciitilde" + "\x09""Adieresis" + "\x05""Aring" + "\x08""Ccedilla" + "\x06""Eacute" + "\x06""Ntilde" + "\x09""Odieresis" + "\x09""Udieresis" + "\x06""aacute" + "\x06""agrave" + "\x0B""acircumflex" + "\x09""adieresis" + "\x06""atilde" + "\x05""aring" + "\x08""ccedilla" + "\x06""eacute" + "\x06""egrave" + "\x0B""ecircumflex" + "\x09""edieresis" + "\x06""iacute" + "\x06""igrave" + "\x0B""icircumflex" + "\x09""idieresis" + "\x06""ntilde" + "\x06""oacute" + "\x06""ograve" + "\x0B""ocircumflex" + "\x09""odieresis" + "\x06""otilde" + "\x06""uacute" + "\x06""ugrave" + "\x0B""ucircumflex" + "\x09""udieresis" + "\x06""dagger" + "\x06""degree" + "\x04""cent" + "\x08""sterling" + "\x07""section" + "\x06""bullet" + "\x09""paragraph" + "\x0A""germandbls" + "\x0A""registered" + "\x09""copyright" + "\x09""trademark" + "\x05""acute" + "\x08""dieresis" + "\x08""notequal" + "\x02""AE" + "\x06""Oslash" + "\x08""infinity" + "\x09""plusminus" + "\x09""lessequal" + "\x0C""greaterequal" + "\x03""yen" + "\x03""mu1" + "\x0B""partialdiff" + "\x09""summation" + "\x07""product" + "\x02""pi" + "\x08""integral" + "\x0B""ordfeminine" + "\x0C""ordmasculine" + "\x03""Ohm" + "\x02""ae" + "\x06""oslash" + "\x0C""questiondown" + "\x0A""exclamdown" + "\x0A""logicalnot" + "\x07""radical" + "\x06""florin" + "\x0B""approxequal" + "\x09""increment" + "\x0D""guillemotleft" + "\x0E""guillemotright" + "\x08""ellipsis" + "\x07""nbspace" + "\x06""Agrave" + "\x06""Atilde" + "\x06""Otilde" + "\x02""OE" + "\x02""oe" + "\x06""endash" + "\x06""emdash" + "\x0C""quotedblleft" + "\x0D""quotedblright" + "\x09""quoteleft" + "\x0A""quoteright" + "\x06""divide" + "\x07""lozenge" + "\x09""ydieresis" + "\x09""Ydieresis" + "\x08""fraction" + "\x08""currency" + "\x0D""guilsinglleft" + "\x0E""guilsinglright" + "\x02""fi" + "\x02""fl" + "\x09""daggerdbl" + "\x0E""periodcentered" + "\x0E""quotesinglbase" + "\x0C""quotedblbase" + "\x0B""perthousand" + "\x0B""Acircumflex" + "\x0B""Ecircumflex" + "\x06""Aacute" + "\x09""Edieresis" + "\x06""Egrave" + "\x06""Iacute" + "\x0B""Icircumflex" + "\x09""Idieresis" + "\x06""Igrave" + "\x06""Oacute" + "\x0B""Ocircumflex" + "\x09""applelogo" + "\x06""Ograve" + "\x06""Uacute" + "\x0B""Ucircumflex" + "\x06""Ugrave" + "\x08""dotlessi" + "\x0A""circumflex" + "\x05""tilde" + "\x09""overscore" + "\x05""breve" + "\x09""dotaccent" + "\x04""ring" + "\x07""cedilla" + "\x0C""hungarumlaut" + "\x06""ogonek" + "\x05""caron" + "\x06""Lslash" + "\x06""lslash" + "\x06""Scaron" + "\x06""scaron" + "\x06""Zcaron" + "\x06""zcaron" + "\x09""brokenbar" + "\x03""Eth" + "\x03""eth" + "\x06""Yacute" + "\x06""yacute" + "\x05""Thorn" + "\x05""thorn" + "\x05""minus" + "\x08""multiply" + "\x0B""onesuperior" + "\x0B""twosuperior" + "\x0D""threesuperior" + "\x07""onehalf" + "\x0A""onequarter" + "\x0D""threequarters" + "\x05""franc" + "\x06""Gbreve" + "\x06""gbreve" + "\x04""Idot" + "\x08""Scedilla" + "\x08""scedilla" + "\x06""Cacute" + "\x06""cacute" + "\x06""Ccaron" + "\x06""ccaron" + "\x07""dmacron" +}; + +/*struct unicodeChar +{ + int cNum; + +};*/ + +unsigned char unicodeChars[] = { + "\x00\x20""space\0" + "\x00\x21""exclamation mark\0" + "\x00\x22""quotation mark\0" + "\x00\x23""number sign\0" + +}; + +/* + +0023 NUMBER SIGN + = pound sign, hash, crosshatch, octothorpe +0024 DOLLAR SIGN + = milreis, escudo + * glyph may have one or two vertical bars + * other currency symbol characters: 20A0-20AF + x (currency sign - 00A4) +0025 PERCENT SIGN + x (arabic percent sign - 066A) + x (per mille sign - 2030) + x (per ten thousand sign - 2031) +0026 AMPERSAND +0027 APOSTROPHE + = APOSTROPHE-QUOTE + = APL quote + * neutral (vertical) glyph having mixed usage + * preferred character for apostrophe is 2019 + * preferred characters in English for paired quotation marks are 2018 & 2019 + x (modifier letter prime - 02B9) + x (modifier letter apostrophe - 02BC) + x (modifier letter vertical line - 02C8) + x (combining acute accent - 0301) + x (prime - 2032) +0028 LEFT PARENTHESIS + = OPENING PARENTHESIS +0029 RIGHT PARENTHESIS + = CLOSING PARENTHESIS + * see discussion on semantics of paired bracketing characters +002A ASTERISK + = star (on phone keypads) + x (arabic five pointed star - 066D) + x (asterisk operator - 2217) + x (heavy asterisk - 2731) +002B PLUS SIGN +002C COMMA + = decimal separator + x (arabic comma - 060C) + x (single low-9 quotation mark - 201A) + x (ideographic comma - 3001) +002D HYPHEN-MINUS + = hyphen or minus sign + * used for either hyphen or minus sign + x (hyphen - 2010) + x (non-breaking hyphen - 2011) + x (figure dash - 2012) + x (en dash - 2013) + x (minus sign - 2212) +002E FULL STOP + = PERIOD + = dot, decimal point + * may be rendered as a raised decimal point in old style numbers + x (arabic full stop - 06D4) + x (ideographic full stop - 3002) +002F SOLIDUS + = SLASH + = virgule, shilling (British) + x (latin letter dental click - 01C0) + x (combining long solidus overlay - 0338) + x (fraction slash - 2044) + x (division slash - 2215) +0030 DIGIT ZERO +0031 DIGIT ONE +0032 DIGIT TWO +0033 DIGIT THREE +0034 DIGIT FOUR +0035 DIGIT FIVE +0036 DIGIT SIX +0037 DIGIT SEVEN +0038 DIGIT EIGHT +0039 DIGIT NINE +003A COLON + x (armenian full stop - 0589) + x (hebrew punctuation sof pasuq - 05C3) + x (ratio - 2236) +003B SEMICOLON + x (greek question mark - 037E) + x (arabic semicolon - 061B) +003C LESS-THAN SIGN + x (single left-pointing angle quotation mark - 2039) + x (left-pointing angle bracket - 2329) + x (left angle bracket - 3008) +003D EQUALS SIGN + * other related characters: 2241-2263 + x (not equal to - 2260) + x (identical to - 2261) +003E GREATER-THAN SIGN + x (single right-pointing angle quotation mark - 203A) + x (right-pointing angle bracket - 232A) + x (right angle bracket - 3009) +003F QUESTION MARK + x (inverted question mark - 00BF) + x (greek question mark - 037E) + x (arabic question mark - 061F) + x (interrobang - 203D) + x (question exclamation mark - 2048) + x (exclamation question mark - 2049) +0040 COMMERCIAL AT +0041 LATIN CAPITAL LETTER A +0042 LATIN CAPITAL LETTER B + x (script capital b - 212C) +0043 LATIN CAPITAL LETTER C + x (double-struck capital c - 2102) + x (black-letter capital c - 212D) +0044 LATIN CAPITAL LETTER D +0045 LATIN CAPITAL LETTER E + x (euler constant - 2107) + x (script capital e - 2130) +0046 LATIN CAPITAL LETTER F + x (script capital f - 2131) + x (turned capital f - 2132) +0047 LATIN CAPITAL LETTER G +0048 LATIN CAPITAL LETTER H + x (script capital h - 210B) + x (black-letter capital h - 210C) + x (double-struck capital h - 210D) +0049 LATIN CAPITAL LETTER I + * Turkish and Azerbaijani use 0131 for lowercase + x (latin capital letter i with dot above - 0130) + x (cyrillic capital letter byelorussian-ukrainian i - 0406) + x (cyrillic letter palochka - 04C0) + x (script capital i - 2110) + x (black-letter capital i - 2111) + x (roman numeral one - 2160) +004A LATIN CAPITAL LETTER J +004B LATIN CAPITAL LETTER K + x (kelvin sign - 212A) +004C LATIN CAPITAL LETTER L + x (script capital l - 2112) +004D LATIN CAPITAL LETTER M + x (script capital m - 2133) +004E LATIN CAPITAL LETTER N + x (double-struck capital n - 2115) +004F LATIN CAPITAL LETTER O +0050 LATIN CAPITAL LETTER P + x (double-struck capital p - 2119) +0051 LATIN CAPITAL LETTER Q + x (double-struck capital q - 211A) +0052 LATIN CAPITAL LETTER R + x (script capital r - 211B) + x (black-letter capital r - 211C) + x (double-struck capital r - 211D) +0053 LATIN CAPITAL LETTER S +0054 LATIN CAPITAL LETTER T +0055 LATIN CAPITAL LETTER U +0056 LATIN CAPITAL LETTER V +0057 LATIN CAPITAL LETTER W +0058 LATIN CAPITAL LETTER X +0059 LATIN CAPITAL LETTER Y +005A LATIN CAPITAL LETTER Z + x (double-struck capital z - 2124) + x (black-letter capital z - 2128) +005B LEFT SQUARE BRACKET + = OPENING SQUARE BRACKET + * other bracket characters: 3008-301B +005C REVERSE SOLIDUS + = BACKSLASH + x (set minus - 2216) +005D RIGHT SQUARE BRACKET + = CLOSING SQUARE BRACKET +005E CIRCUMFLEX ACCENT + * this is a spacing character + x (modifier letter up arrowhead - 02C4) + x (modifier letter circumflex accent - 02C6) + x (combining circumflex accent - 0302) + x (up arrowhead - 2303) +005F LOW LINE + = SPACING UNDERSCORE + * this is a spacing character + x (modifier letter low macron - 02CD) + x (combining macron below - 0331) + x (combining low line - 0332) + x (double low line - 2017) +0060 GRAVE ACCENT + * this is a spacing character + x (modifier letter grave accent - 02CB) + x (combining grave accent - 0300) + x (reversed prime - 2035) +0061 LATIN SMALL LETTER A +0062 LATIN SMALL LETTER B +0063 LATIN SMALL LETTER C +0064 LATIN SMALL LETTER D +0065 LATIN SMALL LETTER E + x (estimated symbol - 212E) + x (script small e - 212F) +0066 LATIN SMALL LETTER F +0067 LATIN SMALL LETTER G + x (latin small letter script g - 0261) + x (script small g - 210A) +0068 LATIN SMALL LETTER H + x (cyrillic small letter shha - 04BB) + x (planck constant - 210E) +0069 LATIN SMALL LETTER I + * Turkish and Azerbaijani use 0130 for uppercase + x (latin small letter dotless i - 0131) +006A LATIN SMALL LETTER J +006B LATIN SMALL LETTER K +006C LATIN SMALL LETTER L + x (script small l - 2113) +006D LATIN SMALL LETTER M +006E LATIN SMALL LETTER N + x (superscript latin small letter n - 207F) +006F LATIN SMALL LETTER O + x (script small o - 2134) +0070 LATIN SMALL LETTER P +0071 LATIN SMALL LETTER Q +0072 LATIN SMALL LETTER R +0073 LATIN SMALL LETTER S +0074 LATIN SMALL LETTER T +0075 LATIN SMALL LETTER U +0076 LATIN SMALL LETTER V +0077 LATIN SMALL LETTER W +0078 LATIN SMALL LETTER X +0079 LATIN SMALL LETTER Y +007A LATIN SMALL LETTER Z + x (latin small letter z with stroke - 01B6) +007B LEFT CURLY BRACKET + = OPENING CURLY BRACKET + = opening brace +007C VERTICAL LINE + = VERTICAL BAR + * used in pairs to indicate absolute value + x (latin letter dental click - 01C0) + x (hebrew punctuation paseq - 05C0) + x (divides - 2223) + x (light vertical bar - 2758) +007D RIGHT CURLY BRACKET + = CLOSING CURLY BRACKET + = closing brace +007E TILDE + * this is a spacing character + x (small tilde - 02DC) + x (combining tilde - 0303) + x (tilde operator - 223C) + x (fullwidth tilde - FF5E) +007F + = DELETE +@@ 0080 C1 Controls and Latin-1 Supplement (Latin-1 Supplement) 00FF +@ C1 controls +@+ Alias names are those for ISO 6429. +0080 +0081 +0082 + = BREAK PERMITTED HERE +0083 + = NO BREAK HERE +0084 +0085 + = NEXT LINE +0086 + = START OF SELECTED AREA +0087 + = END OF SELECTED AREA +0088 + = CHARACTER TABULATION SET +0089 + = CHARACTER TABULATION WITH JUSTIFICATION +008A + = LINE TABULATION SET +008B + = PARTIAL LINE DOWN +008C + = PARTIAL LINE UP +008D + = REVERSE LINE FEED +008E + = SINGLE SHIFT TWO +008F + = SINGLE SHIFT THREE +0090 + = DEVICE CONTROL STRING +0091 + = PRIVATE USE ONE +0092 + = PRIVATE USE TWO +0093 + = SET TRANSMIT STATE +0094 + = CANCEL CHARACTER +0095 + = MESSAGE WAITING +0096 + = START OF GUARDED AREA +0097 + = END OF GUARDED AREA +0098 + = START OF STRING +0099 +009A + = SINGLE CHARACTER INTRODUCER +009B + = CONTROL SEQUENCE INTRODUCER +009C + = STRING TERMINATOR +009D + = OPERATING SYSTEM COMMAND +009E + = PRIVACY MESSAGE +009F + = APPLICATION PROGRAM COMMAND +@ ISO 8859-1 (aka Latin-1) +00A0 NO-BREAK SPACE + x (space - 0020) + x (figure space - 2007) + x (narrow no-break space - 202F) + x (zero width no-break space - FEFF) + # 0020 +00A1 INVERTED EXCLAMATION MARK + * Spanish, Asturian, Galician + x (exclamation mark - 0021) +00A2 CENT SIGN +00A3 POUND SIGN + = pound sterling, Irish punt + x (lira sign - 20A4) +00A4 CURRENCY SIGN + = Filzlaus, Ricardi-Sonne (German names) + * other currency symbol characters: 20A0-20AF + x (dollar sign - 0024) +00A5 YEN SIGN + = yuan sign + * glyph may have one or two crossbars +00A6 BROKEN BAR + = BROKEN VERTICAL BAR + = parted rule (in typography) +00A7 SECTION SIGN + * paragraph sign in some European usage +00A8 DIAERESIS + * this is a spacing character + x (combining diaeresis - 0308) + # 0020 0308 +00A9 COPYRIGHT SIGN + x (sound recording copyright - 2117) +00AA FEMININE ORDINAL INDICATOR + * Spanish + # 0061 +00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK * + = LEFT POINTING GUILLEMET + = chevrons (in typography) + * usually opening, sometimes closing + x (much less-than - 226A) + x (left double angle bracket - 300A) +00AC NOT SIGN + = angled dash (in typography) + x (reversed not sign - 2310) +00AD SOFT HYPHEN + = discretionary hyphen + x (mongolian todo soft hyphen - 1806) +00AE REGISTERED SIGN + = REGISTERED TRADE MARK SIGN +00AF MACRON + = overline, APL overbar + * this is a spacing character + x (modifier letter macron - 02C9) + x (combining macron - 0304) + x (combining overline - 0305) + # 0020 0304 +00B0 DEGREE SIGN + * this is a spacing character + x (ring above - 02DA) + x (combining ring above - 030A) + x (superscript zero - 2070) + x (ring operator - 2218) +00B1 PLUS-MINUS SIGN + x (minus-or-plus sign - 2213) +00B2 SUPERSCRIPT TWO + = squared + * other superscript digit characters: 2070-2079 + x (superscript one - 00B9) + # 0032 +00B3 SUPERSCRIPT THREE + = cubed + x (superscript one - 00B9) + # 0033 +00B4 ACUTE ACCENT + * this is a spacing character + x (modifier letter prime - 02B9) + x (modifier letter acute accent - 02CA) + x (combining acute accent - 0301) + x (prime - 2032) + # 0020 0301 +00B5 MICRO SIGN + # 03BC greek small letter mu +00B6 PILCROW SIGN + = PARAGRAPH SIGN + * section sign in some European usage + x (reversed pilcrow sign - 204B) + x (curved stem paragraph sign ornament - 2761) +00B7 MIDDLE DOT + = midpoint (in typography) + = Georgian comma + = Greek middle dot + x (bullet - 2022) + x (one dot leader - 2024) + x (hyphenation point - 2027) + x (bullet operator - 2219) + x (dot operator - 22C5) + x (katakana middle dot - 30FB) +00B8 CEDILLA + * this is a spacing character + * other spacing accent characters: 02D8-02DB + x (combining cedilla - 0327) + # 0020 0327 +00B9 SUPERSCRIPT ONE + x (superscript two - 00B2) + x (superscript three - 00B3) + # 0031 +00BA MASCULINE ORDINAL INDICATOR + * Spanish + # 006F +00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK * + = RIGHT POINTING GUILLEMET + * usually closing, sometimes opening + x (much greater-than - 226B) + x (right double angle bracket - 300B) +00BC VULGAR FRACTION ONE QUARTER + * bar may be horizontal or slanted + * other fraction characters: 2153-215E + # 0031 2044 0034 +00BD VULGAR FRACTION ONE HALF + * bar may be horizontal or slanted + # 0031 2044 0032 +00BE VULGAR FRACTION THREE QUARTERS + * bar may be horizontal or slanted + # 0033 2044 0034 +00BF INVERTED QUESTION MARK + = turned question mark + * Spanish + x (question mark - 003F) +00C0 LATIN CAPITAL LETTER A WITH GRAVE + : 0041 0300 +00C1 LATIN CAPITAL LETTER A WITH ACUTE + : 0041 0301 +00C2 LATIN CAPITAL LETTER A WITH CIRCUMFLEX + : 0041 0302 +00C3 LATIN CAPITAL LETTER A WITH TILDE + : 0041 0303 +00C4 LATIN CAPITAL LETTER A WITH DIAERESIS + : 0041 0308 +00C5 LATIN CAPITAL LETTER A WITH RING ABOVE + x (angstrom sign - 212B) + : 0041 030A +00C6 LATIN CAPITAL LETTER AE (ash) * + = LATIN CAPITAL LIGATURE AE +00C7 LATIN CAPITAL LETTER C WITH CEDILLA + : 0043 0327 +00C8 LATIN CAPITAL LETTER E WITH GRAVE + : 0045 0300 +00C9 LATIN CAPITAL LETTER E WITH ACUTE + : 0045 0301 +00CA LATIN CAPITAL LETTER E WITH CIRCUMFLEX + : 0045 0302 +00CB LATIN CAPITAL LETTER E WITH DIAERESIS + : 0045 0308 +00CC LATIN CAPITAL LETTER I WITH GRAVE + : 0049 0300 +00CD LATIN CAPITAL LETTER I WITH ACUTE + : 0049 0301 +00CE LATIN CAPITAL LETTER I WITH CIRCUMFLEX + : 0049 0302 +00CF LATIN CAPITAL LETTER I WITH DIAERESIS + : 0049 0308 +00D0 LATIN CAPITAL LETTER ETH (Icelandic) + x (latin small letter eth - 00F0) + x (latin capital letter d with stroke - 0110) + x (latin capital letter african d - 0189) +00D1 LATIN CAPITAL LETTER N WITH TILDE + : 004E 0303 +00D2 LATIN CAPITAL LETTER O WITH GRAVE + : 004F 0300 +00D3 LATIN CAPITAL LETTER O WITH ACUTE + : 004F 0301 +00D4 LATIN CAPITAL LETTER O WITH CIRCUMFLEX + : 004F 0302 +00D5 LATIN CAPITAL LETTER O WITH TILDE + : 004F 0303 +00D6 LATIN CAPITAL LETTER O WITH DIAERESIS + : 004F 0308 +00D7 MULTIPLICATION SIGN + = z notation Cartesian product +00D8 LATIN CAPITAL LETTER O WITH STROKE + = LATIN CAPITAL LETTER O SLASH + x (empty set - 2205) +00D9 LATIN CAPITAL LETTER U WITH GRAVE + : 0055 0300 +00DA LATIN CAPITAL LETTER U WITH ACUTE + : 0055 0301 +00DB LATIN CAPITAL LETTER U WITH CIRCUMFLEX + : 0055 0302 +00DC LATIN CAPITAL LETTER U WITH DIAERESIS + : 0055 0308 +00DD LATIN CAPITAL LETTER Y WITH ACUTE + : 0059 0301 +00DE LATIN CAPITAL LETTER THORN (Icelandic) +00DF LATIN SMALL LETTER SHARP S (German) + = Eszett + * German + * uppercase is "SS" + * in origin a ligature of 017F and 0073 + x (greek small letter beta - 03B2) +00E0 LATIN SMALL LETTER A WITH GRAVE + : 0061 0300 +00E1 LATIN SMALL LETTER A WITH ACUTE + : 0061 0301 +00E2 LATIN SMALL LETTER A WITH CIRCUMFLEX + : 0061 0302 +00E3 LATIN SMALL LETTER A WITH TILDE + * Portuguese + : 0061 0303 +00E4 LATIN SMALL LETTER A WITH DIAERESIS + : 0061 0308 +00E5 LATIN SMALL LETTER A WITH RING ABOVE + * Danish, Norwegian, Swedish, Walloon + : 0061 030A +00E6 LATIN SMALL LETTER AE (ash) * + = LATIN SMALL LIGATURE AE + = ash (from Old English æsc) + * Danish, Norwegian, Icelandic, Faroese, Old English, French, IPA + x (latin small ligature oe - 0153) + x (cyrillic small ligature a ie - 04D5) +00E7 LATIN SMALL LETTER C WITH CEDILLA + : 0063 0327 +00E8 LATIN SMALL LETTER E WITH GRAVE + : 0065 0300 +00E9 LATIN SMALL LETTER E WITH ACUTE + : 0065 0301 +00EA LATIN SMALL LETTER E WITH CIRCUMFLEX + : 0065 0302 +00EB LATIN SMALL LETTER E WITH DIAERESIS + : 0065 0308 +00EC LATIN SMALL LETTER I WITH GRAVE + * Italian, Malagasy + : 0069 0300 +00ED LATIN SMALL LETTER I WITH ACUTE + : 0069 0301 +00EE LATIN SMALL LETTER I WITH CIRCUMFLEX + : 0069 0302 +00EF LATIN SMALL LETTER I WITH DIAERESIS + : 0069 0308 +00F0 LATIN SMALL LETTER ETH (Icelandic) + * Icelandic, Faroese, Old English, IPA + x (latin capital letter eth - 00D0) + x (greek small letter delta - 03B4) + x (partial differential - 2202) +00F1 LATIN SMALL LETTER N WITH TILDE + : 006E 0303 +00F2 LATIN SMALL LETTER O WITH GRAVE + : 006F 0300 +00F3 LATIN SMALL LETTER O WITH ACUTE + : 006F 0301 +00F4 LATIN SMALL LETTER O WITH CIRCUMFLEX + : 006F 0302 +00F5 LATIN SMALL LETTER O WITH TILDE + * Portuguese, Estonian + : 006F 0303 +00F6 LATIN SMALL LETTER O WITH DIAERESIS + : 006F 0308 +00F7 DIVISION SIGN +00F8 LATIN SMALL LETTER O WITH STROKE + = LATIN SMALL LETTER O SLASH + * Danish, Norwegian, Faroese, IPA +00F9 LATIN SMALL LETTER U WITH GRAVE + * French, Italian + : 0075 0300 +00FA LATIN SMALL LETTER U WITH ACUTE + : 0075 0301 +00FB LATIN SMALL LETTER U WITH CIRCUMFLEX + : 0075 0302 +00FC LATIN SMALL LETTER U WITH DIAERESIS + : 0075 0308 +00FD LATIN SMALL LETTER Y WITH ACUTE + * Czech, Slovak, Icelandic, Faroese, Welsh, Malagasy + : 0079 0301 +00FE LATIN SMALL LETTER THORN (Icelandic) + * Icelandic, Old English, phonetics + * Runic letter borrowed into Latin script + x (runic letter thurisaz thurs thorn - 16A6) +00FF LATIN SMALL LETTER Y WITH DIAERESIS + * French + x (latin capital letter y with diaeresis - 0178) + : 0079 0308 +@@ 0100 Latin Extended-A 017F +@ European Latin +0100 LATIN CAPITAL LETTER A WITH MACRON + : 0041 0304 +0101 LATIN SMALL LETTER A WITH MACRON + * Latvian, Latin, ... + : 0061 0304 +0102 LATIN CAPITAL LETTER A WITH BREVE + : 0041 0306 +0103 LATIN SMALL LETTER A WITH BREVE + * Romanian, Vietnamese, Latin, ... + : 0061 0306 +0104 LATIN CAPITAL LETTER A WITH OGONEK + : 0041 0328 +0105 LATIN SMALL LETTER A WITH OGONEK + * Polish, Lithuanian, ... + : 0061 0328 +0106 LATIN CAPITAL LETTER C WITH ACUTE + : 0043 0301 +0107 LATIN SMALL LETTER C WITH ACUTE + * Polish, Croatian, ... + x (cyrillic small letter tshe - 045B) + : 0063 0301 +0108 LATIN CAPITAL LETTER C WITH CIRCUMFLEX + : 0043 0302 +0109 LATIN SMALL LETTER C WITH CIRCUMFLEX + * Esperanto + : 0063 0302 +010A LATIN CAPITAL LETTER C WITH DOT ABOVE + : 0043 0307 +010B LATIN SMALL LETTER C WITH DOT ABOVE + * Maltese, Irish Gaelic (old orthography) + : 0063 0307 +010C LATIN CAPITAL LETTER C WITH CARON + : 0043 030C +010D LATIN SMALL LETTER C WITH CARON + * Czech, Slovak, Slovenian, and many other languages + : 0063 030C +010E LATIN CAPITAL LETTER D WITH CARON + * the form using caron/hacek is preferred in all contexts + : 0044 030C +010F LATIN SMALL LETTER D WITH CARON + * Czech, Slovak + * the form using apostrophe is preferred in typesetting + : 0064 030C +0110 LATIN CAPITAL LETTER D WITH STROKE + x (latin capital letter eth - 00D0) + x (latin small letter d with stroke - 0111) + x (latin capital letter african d - 0189) +0111 LATIN SMALL LETTER D WITH STROKE + * Croatian, Vietnamese, Sámi + x (latin capital letter d with stroke - 0110) + x (cyrillic small letter dje - 0452) +0112 LATIN CAPITAL LETTER E WITH MACRON + : 0045 0304 +0113 LATIN SMALL LETTER E WITH MACRON + * Latvian, Latin, ... + : 0065 0304 +0114 LATIN CAPITAL LETTER E WITH BREVE + : 0045 0306 +0115 LATIN SMALL LETTER E WITH BREVE + * Malay, Latin, ... + : 0065 0306 +0116 LATIN CAPITAL LETTER E WITH DOT ABOVE + : 0045 0307 +0117 LATIN SMALL LETTER E WITH DOT ABOVE + * Lithuanian + : 0065 0307 +0118 LATIN CAPITAL LETTER E WITH OGONEK + : 0045 0328 +0119 LATIN SMALL LETTER E WITH OGONEK + * Polish, Lithuanian, ... + : 0065 0328 +011A LATIN CAPITAL LETTER E WITH CARON + : 0045 030C +011B LATIN SMALL LETTER E WITH CARON + * Czech, ... + : 0065 030C +011C LATIN CAPITAL LETTER G WITH CIRCUMFLEX + : 0047 0302 +011D LATIN SMALL LETTER G WITH CIRCUMFLEX + * Esperanto + : 0067 0302 +011E LATIN CAPITAL LETTER G WITH BREVE + : 0047 0306 +011F LATIN SMALL LETTER G WITH BREVE + * Turkish, Azerbaijani + x (latin small letter g with caron - 01E7) + : 0067 0306 +0120 LATIN CAPITAL LETTER G WITH DOT ABOVE + : 0047 0307 +0121 LATIN SMALL LETTER G WITH DOT ABOVE + * Maltese, Irish Gaelic (old orthography) + : 0067 0307 +0122 LATIN CAPITAL LETTER G WITH CEDILLA + : 0047 0327 +0123 LATIN SMALL LETTER G WITH CEDILLA + * Latvian + * there are three major glyph variants + : 0067 0327 +0124 LATIN CAPITAL LETTER H WITH CIRCUMFLEX + : 0048 0302 +0125 LATIN SMALL LETTER H WITH CIRCUMFLEX + * Esperanto + : 0068 0302 +0126 LATIN CAPITAL LETTER H WITH STROKE +0127 LATIN SMALL LETTER H WITH STROKE + * Maltese, IPA, ... + x (cyrillic small letter tshe - 045B) + x (planck constant over two pi - 210F) +0128 LATIN CAPITAL LETTER I WITH TILDE + : 0049 0303 +0129 LATIN SMALL LETTER I WITH TILDE + * Greenlandic (old orthography) + : 0069 0303 +012A LATIN CAPITAL LETTER I WITH MACRON + : 0049 0304 +012B LATIN SMALL LETTER I WITH MACRON + * Latvian, Latin, ... + : 0069 0304 +012C LATIN CAPITAL LETTER I WITH BREVE + : 0049 0306 +012D LATIN SMALL LETTER I WITH BREVE + * Latin, ... + : 0069 0306 +012E LATIN CAPITAL LETTER I WITH OGONEK + : 0049 0328 +012F LATIN SMALL LETTER I WITH OGONEK + * Lithuanian, ... + : 0069 0328 +0130 LATIN CAPITAL LETTER I WITH DOT ABOVE + = LATIN CAPITAL LETTER I DOT + * Turkish, Azerbaijani + * lowercase is 0069 + x (latin capital letter i - 0049) + : 0049 0307 +0131 LATIN SMALL LETTER DOTLESS I + * Turkish, Azerbaijani + * uppercase is 0049 + x (latin small letter i - 0069) +0132 LATIN CAPITAL LIGATURE IJ + # 0049 004A +0133 LATIN SMALL LIGATURE IJ + * Dutch + # 0069 006A +0134 LATIN CAPITAL LETTER J WITH CIRCUMFLEX + : 004A 0302 +0135 LATIN SMALL LETTER J WITH CIRCUMFLEX + * Esperanto + : 006A 0302 +0136 LATIN CAPITAL LETTER K WITH CEDILLA + : 004B 0327 +0137 LATIN SMALL LETTER K WITH CEDILLA + * Latvian + : 006B 0327 +0138 LATIN SMALL LETTER KRA (Greenlandic) + * Greenlandic (old orthography) +0139 LATIN CAPITAL LETTER L WITH ACUTE + : 004C 0301 +013A LATIN SMALL LETTER L WITH ACUTE + * Slovak + : 006C 0301 +013B LATIN CAPITAL LETTER L WITH CEDILLA + : 004C 0327 +013C LATIN SMALL LETTER L WITH CEDILLA + * Latvian + : 006C 0327 +013D LATIN CAPITAL LETTER L WITH CARON + : 004C 030C +013E LATIN SMALL LETTER L WITH CARON + * Slovak + * the form using apostrophe is preferred in typesetting + : 006C 030C +013F LATIN CAPITAL LETTER L WITH MIDDLE DOT + * some fonts show the middle dot inside the L, but the preferred form has the dot following the L + # 004C 00B7 +0140 LATIN SMALL LETTER L WITH MIDDLE DOT + * Catalan + # 006C 00B7 +0141 LATIN CAPITAL LETTER L WITH STROKE +0142 LATIN SMALL LETTER L WITH STROKE + * Polish, ... + x (latin small letter l with bar - 019A) +0143 LATIN CAPITAL LETTER N WITH ACUTE + : 004E 0301 +0144 LATIN SMALL LETTER N WITH ACUTE + * Polish, ... + : 006E 0301 +0145 LATIN CAPITAL LETTER N WITH CEDILLA + : 004E 0327 +0146 LATIN SMALL LETTER N WITH CEDILLA + * Latvian + : 006E 0327 +0147 LATIN CAPITAL LETTER N WITH CARON + : 004E 030C +0148 LATIN SMALL LETTER N WITH CARON + * Czech, Slovak + : 006E 030C +0149 LATIN SMALL LETTER N PRECEDED BY APOSTROPHE + = LATIN SMALL LETTER APOSTROPHE N + * Afrikaans + * this is not actually a single letter + # 02BC 006E +014A LATIN CAPITAL LETTER ENG (Sami) + * glyph may also have appearance of large form of the small letter +014B LATIN SMALL LETTER ENG (Sami) + * Sámi, Mende, IPA, ... +014C LATIN CAPITAL LETTER O WITH MACRON + : 004F 0304 +014D LATIN SMALL LETTER O WITH MACRON + * Latvian, Latin, ... + : 006F 0304 +014E LATIN CAPITAL LETTER O WITH BREVE + : 004F 0306 +014F LATIN SMALL LETTER O WITH BREVE + * Latin + : 006F 0306 +0150 LATIN CAPITAL LETTER O WITH DOUBLE ACUTE + : 004F 030B +0151 LATIN SMALL LETTER O WITH DOUBLE ACUTE + * Hungarian + : 006F 030B +0152 LATIN CAPITAL LIGATURE OE +0153 LATIN SMALL LIGATURE OE + = LATIN SMALL LETTER O E + = ethel (from Old English eðel) + * French, IPA, Old Icelandic, Old English, ... + x (latin small letter ae - 00E6) + x (latin letter small capital oe - 0276) +0154 LATIN CAPITAL LETTER R WITH ACUTE + : 0052 0301 +0155 LATIN SMALL LETTER R WITH ACUTE + * Slovak, ... + : 0072 0301 +0156 LATIN CAPITAL LETTER R WITH CEDILLA + : 0052 0327 +0157 LATIN SMALL LETTER R WITH CEDILLA + * Latvian + : 0072 0327 +0158 LATIN CAPITAL LETTER R WITH CARON + : 0052 030C +0159 LATIN SMALL LETTER R WITH CARON + * Czech, ... + : 0072 030C +015A LATIN CAPITAL LETTER S WITH ACUTE + : 0053 0301 +015B LATIN SMALL LETTER S WITH ACUTE + * Polish, Indic transliteration, ... + : 0073 0301 +015C LATIN CAPITAL LETTER S WITH CIRCUMFLEX + : 0053 0302 +015D LATIN SMALL LETTER S WITH CIRCUMFLEX + * Esperanto + : 0073 0302 +015E LATIN CAPITAL LETTER S WITH CEDILLA * + : 0053 0327 +015F LATIN SMALL LETTER S WITH CEDILLA * + * Turkish, Azerbaijani, Romanian, ... + * this character is used in both Turkish and Romanian data + * a glyph variant with comma below is preferred for Romanian + x (latin small letter s with comma below - 0219) + : 0073 0327 +0160 LATIN CAPITAL LETTER S WITH CARON + : 0053 030C +0161 LATIN SMALL LETTER S WITH CARON + * Czech, Estonian, Finnish, Slovak, and many other languages + : 0073 030C +0162 LATIN CAPITAL LETTER T WITH CEDILLA * + : 0054 0327 +0163 LATIN SMALL LETTER T WITH CEDILLA * + * Romanian, Semitic transliteration, ... + * this character is used in Romanian data + * a glyph variant with comma below is preferred for Romanian + x (latin small letter t with comma below - 021B) + : 0074 0327 +0164 LATIN CAPITAL LETTER T WITH CARON + * the form using caron/hacek is preferred in all contexts + : 0054 030C +0165 LATIN SMALL LETTER T WITH CARON + * Czech, Slovak + * the form using apostrophe is preferred in typesetting + : 0074 030C +0166 LATIN CAPITAL LETTER T WITH STROKE +0167 LATIN SMALL LETTER T WITH STROKE + * Sámi +0168 LATIN CAPITAL LETTER U WITH TILDE + : 0055 0303 +0169 LATIN SMALL LETTER U WITH TILDE + * Greenlandic (old orthography) + : 0075 0303 +016A LATIN CAPITAL LETTER U WITH MACRON + : 0055 0304 +016B LATIN SMALL LETTER U WITH MACRON + * Latvian, Lithuanian, Latin, ... + : 0075 0304 +016C LATIN CAPITAL LETTER U WITH BREVE + : 0055 0306 +016D LATIN SMALL LETTER U WITH BREVE + * Latin, Esperanto, ... + : 0075 0306 +016E LATIN CAPITAL LETTER U WITH RING ABOVE + : 0055 030A +016F LATIN SMALL LETTER U WITH RING ABOVE + * Czech, ... + : 0075 030A +0170 LATIN CAPITAL LETTER U WITH DOUBLE ACUTE + : 0055 030B +0171 LATIN SMALL LETTER U WITH DOUBLE ACUTE + * Hungarian + : 0075 030B +0172 LATIN CAPITAL LETTER U WITH OGONEK + : 0055 0328 +0173 LATIN SMALL LETTER U WITH OGONEK + * Lithuanian + : 0075 0328 +0174 LATIN CAPITAL LETTER W WITH CIRCUMFLEX + : 0057 0302 +0175 LATIN SMALL LETTER W WITH CIRCUMFLEX + * Welsh + : 0077 0302 +0176 LATIN CAPITAL LETTER Y WITH CIRCUMFLEX + : 0059 0302 +0177 LATIN SMALL LETTER Y WITH CIRCUMFLEX + * Welsh + : 0079 0302 +0178 LATIN CAPITAL LETTER Y WITH DIAERESIS + * French, Igbo + x (latin small letter y with diaeresis - 00FF) + : 0059 0308 +0179 LATIN CAPITAL LETTER Z WITH ACUTE + : 005A 0301 +017A LATIN SMALL LETTER Z WITH ACUTE + * Polish, ... + : 007A 0301 +017B LATIN CAPITAL LETTER Z WITH DOT ABOVE + : 005A 0307 +017C LATIN SMALL LETTER Z WITH DOT ABOVE + * Polish, ... + : 007A 0307 +017D LATIN CAPITAL LETTER Z WITH CARON + : 005A 030C +017E LATIN SMALL LETTER Z WITH CARON + * Czech, Estonian, Finnish, Slovak, Slovenian, and many other languages + : 007A 030C +017F LATIN SMALL LETTER LONG S + * in common use in Roman types until the 18th century + * in current use in Fraktur and Gaelic types + # 0073 latin small letter s +@@ 0180 Latin Extended-B 024F +@ Latin extended-B +0180 LATIN SMALL LETTER B WITH STROKE + * Americanist and Indo-Europeanist usage for phonetic beta + * Old Saxon + x (greek small letter beta - 03B2) + x (blank symbol - 2422) +0181 LATIN CAPITAL LETTER B WITH HOOK + * Zulu, Pan-Nigerian alphabet + x (latin small letter b with hook - 0253) +0182 LATIN CAPITAL LETTER B WITH TOPBAR +0183 LATIN SMALL LETTER B WITH TOPBAR + * Zhuang + * former Soviet minority language scripts + x (cyrillic capital letter be - 0411) +0184 LATIN CAPITAL LETTER TONE SIX +0185 LATIN SMALL LETTER TONE SIX + * Zhuang + * Zhuang tone three is Cyrillic ze + * Zhuang tone four is Cyrillic che + x (latin small letter tone two - 01A8) + x (latin small letter tone five - 01BD) + x (cyrillic small letter ze - 0437) + x (cyrillic small letter che - 0447) + x (cyrillic small letter soft sign - 044C) +0186 LATIN CAPITAL LETTER OPEN O + * typographically a turned C + x (latin small letter open o - 0254) +0187 LATIN CAPITAL LETTER C WITH HOOK +0188 LATIN SMALL LETTER C WITH HOOK + * African +0189 LATIN CAPITAL LETTER AFRICAN D * + * Ewe + x (latin capital letter eth - 00D0) + x (latin capital letter d with stroke - 0110) + x (latin small letter d with tail - 0256) +018A LATIN CAPITAL LETTER D WITH HOOK + * Pan-Nigerian alphabet + x (latin small letter d with hook - 0257) +018B LATIN CAPITAL LETTER D WITH TOPBAR +018C LATIN SMALL LETTER D WITH TOPBAR + * former-Soviet minority language scripts +018D LATIN SMALL LETTER TURNED DELTA + * archaic phonetic for labialized dental fricative + * recommended spellings 007A 02B7 or 007A 032B +018E LATIN CAPITAL LETTER REVERSED E + = LATIN CAPITAL LETTER TURNED E + * Pan-Nigerian alphabet + * lowercase is 01DD +018F LATIN CAPITAL LETTER SCHWA + * Azerbaijani, ... + x (latin small letter schwa - 0259) + x (cyrillic capital letter schwa - 04D8) +0190 LATIN CAPITAL LETTER OPEN E + = LATIN CAPITAL LETTER EPSILON + * African + x (latin small letter open e - 025B) + x (euler constant - 2107) +0191 LATIN CAPITAL LETTER F WITH HOOK + * African +0192 LATIN SMALL LETTER F WITH HOOK + = LATIN SMALL LETTER SCRIPT F + = Florin currency symbol (Netherlands) + = function symbol + = abbreviation convention for folder +0193 LATIN CAPITAL LETTER G WITH HOOK + * African + x (latin small letter g with hook - 0260) +0194 LATIN CAPITAL LETTER GAMMA + * African + x (latin small letter gamma - 0263) +0195 LATIN SMALL LETTER HV (hwair) + * Gothic transliteration + * uppercase is 01F6 +0196 LATIN CAPITAL LETTER IOTA + * African + x (latin small letter iota - 0269) +0197 LATIN CAPITAL LETTER I WITH STROKE + = barred i, i bar + * African + * ISO 6438 gives lowercase as 026A, not 0268 + x (latin letter small capital i - 026A) +0198 LATIN CAPITAL LETTER K WITH HOOK +0199 LATIN SMALL LETTER K WITH HOOK + * Hausa, Pan-Nigerian alphabet +019A LATIN SMALL LETTER L WITH BAR + = barred l + * Americanist phonetic usage for 026C + x (latin small letter l with stroke - 0142) +019B LATIN SMALL LETTER LAMBDA WITH STROKE + = barred lambda, lambda bar + * Americanist phonetic usage +019C LATIN CAPITAL LETTER TURNED M + * Zhuang + x (latin small letter turned m - 026F) +019D LATIN CAPITAL LETTER N WITH LEFT HOOK + * African + x (latin small letter n with left hook - 0272) +019E LATIN SMALL LETTER N WITH LONG RIGHT LEG + * archaic phonetic for Japanese syllabic "n" + * recommended spelling 006E 0329 +019F LATIN CAPITAL LETTER O WITH MIDDLE TILDE * + = barred o, o bar + * lowercase is 0275 + * African + x (cyrillic capital letter barred o - 04E8) +01A0 LATIN CAPITAL LETTER O WITH HORN + : 004F 031B +01A1 LATIN SMALL LETTER O WITH HORN + * Vietnamese + : 006F 031B +01A2 LATIN CAPITAL LETTER OI (gha) +01A3 LATIN SMALL LETTER OI (gha) + = gha + * Pan-Turkic Latin alphabets +01A4 LATIN CAPITAL LETTER P WITH HOOK +01A5 LATIN SMALL LETTER P WITH HOOK + * African +01A6 LATIN LETTER YR * + * old Norse + * from German Standard DIN 31624 and ISO 5246-2 + * lowercase is 0280 +01A7 LATIN CAPITAL LETTER TONE TWO +01A8 LATIN SMALL LETTER TONE TWO + * Zhuang + * typographically a reversed S + x (latin small letter tone six - 0185) +01A9 LATIN CAPITAL LETTER ESH + * African + x (latin small letter esh - 0283) + x (greek capital letter sigma - 03A3) +01AA LATIN LETTER REVERSED ESH LOOP + * archaic phonetic for labialized palatoalveolar or palatal fricative + * Twi + * recommended spellings 0283 02B7, 00E7 02B7, 0068 0265, etc. +01AB LATIN SMALL LETTER T WITH PALATAL HOOK + * archaic phonetic for palatalized alveolar or dental stop + * recommended spelling 0074 02B2 +01AC LATIN CAPITAL LETTER T WITH HOOK +01AD LATIN SMALL LETTER T WITH HOOK + * African +01AE LATIN CAPITAL LETTER T WITH RETROFLEX HOOK + * African + x (latin small letter t with retroflex hook - 0288) +01AF LATIN CAPITAL LETTER U WITH HORN + : 0055 031B +01B0 LATIN SMALL LETTER U WITH HORN + * Vietnamese + : 0075 031B +01B1 LATIN CAPITAL LETTER UPSILON + * African + * typographically based on turned capital Greek omega + x (latin small letter upsilon - 028A) + x (inverted ohm sign - 2127) +01B2 LATIN CAPITAL LETTER V WITH HOOK + = LATIN CAPITAL LETTER SCRIPT V + * African + x (latin small letter v with hook - 028B) +01B3 LATIN CAPITAL LETTER Y WITH HOOK +01B4 LATIN SMALL LETTER Y WITH HOOK + * Bini, Esoko, and other Edo languages in West Africa +01B5 LATIN CAPITAL LETTER Z WITH STROKE +01B6 LATIN SMALL LETTER Z WITH STROKE + = barred z, z bar + * Pan-Turkic Latin orthography + * handwritten variant of Latin "z" + x (latin small letter z - 007A) +01B7 LATIN CAPITAL LETTER EZH + * African, Skolt Sámi + * lowercase is 0292 + x (latin capital letter yogh - 021C) + x (cyrillic capital letter abkhasian dze - 04E0) +01B8 LATIN CAPITAL LETTER EZH REVERSED +01B9 LATIN SMALL LETTER EZH REVERSED + * archaic phonetic for voiced pharyngeal fricative + * sometimes typographically rendered with a turned digit 3 + * recommended spelling 0295 + x (latin letter pharyngeal voiced fricative - 0295) + x (arabic letter ain - 0639) +01BA LATIN SMALL LETTER EZH WITH TAIL + * archaic phonetic for labialized voiced palatoalveolar or palatal fricative + * Twi + * recommended spellings 0292 02B7 or 006A 02B7 +01BB LATIN LETTER TWO WITH STROKE + * archaic phonetic for [dz] affricate + * recommended spellings 0292 or 0064 007A +01BC LATIN CAPITAL LETTER TONE FIVE +01BD LATIN SMALL LETTER TONE FIVE + * Zhuang + x (latin small letter tone six - 0185) +01BE LATIN LETTER INVERTED GLOTTAL STOP WITH STROKE + * archaic phonetic for [ts] affricate + * recommended spelling 0074 0073 + * letter form is actually derived from ligation of ts, rather than inverted glottal stop +01BF LATIN LETTER WYNN + = wen + * Runic letter borrowed into Latin script + * replaced by "w" in modern transcriptions of Old English + * uppercase is 01F7 + x (runic letter wunjo wynn w - 16B9) +01C0 LATIN LETTER DENTAL CLICK + = pipe + * Khoisan tradition + * "c" in Zulu orthography + x (solidus - 002F) + x (vertical line - 007C) + x (latin small letter turned t - 0287) + x (divides - 2223) +01C1 LATIN LETTER LATERAL CLICK + = double pipe + * Khoisan tradition + * "x" in Zulu orthography + x (latin letter inverted glottal stop - 0296) + x (parallel to - 2225) +01C2 LATIN LETTER ALVEOLAR CLICK + = double-barred pipe + * Khoisan tradition + x (not equal to - 2260) +01C3 LATIN LETTER RETROFLEX CLICK + = LATIN LETTER EXCLAMATION MARK + * Khoisan tradition + * "q" in Zulu orthography + x (exclamation mark - 0021) + x (latin letter stretched c - 0297) +@ Croatian digraphs matching Serbian Cyrillic letters +01C4 LATIN CAPITAL LETTER DZ WITH CARON + # 0044 017D +01C5 LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON + # 0044 017E +01C6 LATIN SMALL LETTER DZ WITH CARON + x (cyrillic small letter dzhe - 045F) + # 0064 017E +01C7 LATIN CAPITAL LETTER LJ + # 004C 004A +01C8 LATIN CAPITAL LETTER L WITH SMALL LETTER J + # 004C 006A +01C9 LATIN SMALL LETTER LJ + x (cyrillic small letter lje - 0459) + # 006C 006A +01CA LATIN CAPITAL LETTER NJ + # 004E 004A +01CB LATIN CAPITAL LETTER N WITH SMALL LETTER J + # 004E 006A +01CC LATIN SMALL LETTER NJ + x (cyrillic small letter nje - 045A) + # 006E 006A +@ Pinyin diacritic-vowel combinations +01CD LATIN CAPITAL LETTER A WITH CARON + : 0041 030C +01CE LATIN SMALL LETTER A WITH CARON + * Pinyin third tone + : 0061 030C +01CF LATIN CAPITAL LETTER I WITH CARON + : 0049 030C +01D0 LATIN SMALL LETTER I WITH CARON + * Pinyin third tone + : 0069 030C +01D1 LATIN CAPITAL LETTER O WITH CARON + : 004F 030C +01D2 LATIN SMALL LETTER O WITH CARON + * Pinyin third tone + : 006F 030C +01D3 LATIN CAPITAL LETTER U WITH CARON + : 0055 030C +01D4 LATIN SMALL LETTER U WITH CARON + * Pinyin third tone + : 0075 030C +01D5 LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON + : 00DC 0304 +01D6 LATIN SMALL LETTER U WITH DIAERESIS AND MACRON + * Pinyin first tone + : 00FC 0304 +01D7 LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE + : 00DC 0301 +01D8 LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE + * Pinyin second tone + : 00FC 0301 +01D9 LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON + : 00DC 030C +01DA LATIN SMALL LETTER U WITH DIAERESIS AND CARON + * Pinyin third tone + : 00FC 030C +01DB LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE + : 00DC 0300 +01DC LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE + * Pinyin fourth tone + : 00FC 0300 +@ Additions +01DD LATIN SMALL LETTER TURNED E + * Pan-Nigerian alphabet + * all other usages of schwa are 0259 + * uppercase is 018E + x (latin small letter schwa - 0259) +01DE LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON + : 00C4 0304 +01DF LATIN SMALL LETTER A WITH DIAERESIS AND MACRON + * Livonian, Uralicist usage + : 00E4 0304 +01E0 LATIN CAPITAL LETTER A WITH DOT ABOVE AND MACRON + : 0226 0304 +01E1 LATIN SMALL LETTER A WITH DOT ABOVE AND MACRON + * Uralicist usage + : 0227 0304 +01E2 LATIN CAPITAL LETTER AE WITH MACRON (ash) * + : 00C6 0304 +01E3 LATIN SMALL LETTER AE WITH MACRON (ash) * + * Old Norse, Old English + : 00E6 0304 +01E4 LATIN CAPITAL LETTER G WITH STROKE +01E5 LATIN SMALL LETTER G WITH STROKE + * Skolt Sámi +01E6 LATIN CAPITAL LETTER G WITH CARON + : 0047 030C +01E7 LATIN SMALL LETTER G WITH CARON + * Skolt Sámi + x (latin small letter g with breve - 011F) + : 0067 030C +01E8 LATIN CAPITAL LETTER K WITH CARON + : 004B 030C +01E9 LATIN SMALL LETTER K WITH CARON + * Skolt Sámi + : 006B 030C +01EA LATIN CAPITAL LETTER O WITH OGONEK + : 004F 0328 +01EB LATIN SMALL LETTER O WITH OGONEK + * Sámi, Iroquoian, Old Icelandic + : 006F 0328 +01EC LATIN CAPITAL LETTER O WITH OGONEK AND MACRON + : 01EA 0304 +01ED LATIN SMALL LETTER O WITH OGONEK AND MACRON + * Old Icelandic + : 01EB 0304 +01EE LATIN CAPITAL LETTER EZH WITH CARON + : 01B7 030C +01EF LATIN SMALL LETTER EZH WITH CARON + * Skolt Sámi + : 0292 030C +01F0 LATIN SMALL LETTER J WITH CARON + * IPA and many languages + : 006A 030C +01F1 LATIN CAPITAL LETTER DZ + # 0044 005A +01F2 LATIN CAPITAL LETTER D WITH SMALL LETTER Z + # 0044 007A +01F3 LATIN SMALL LETTER DZ + # 0064 007A +01F4 LATIN CAPITAL LETTER G WITH ACUTE + : 0047 0301 +01F5 LATIN SMALL LETTER G WITH ACUTE + * Macedonian and Serbian transliteration + : 0067 0301 +01F6 LATIN CAPITAL LETTER HWAIR + * lowercase is 0195 +01F7 LATIN CAPITAL LETTER WYNN + = wen + * lowercase is 01BF +01F8 LATIN CAPITAL LETTER N WITH GRAVE + : 004E 0300 +01F9 LATIN SMALL LETTER N WITH GRAVE + * Pinyin + : 006E 0300 +01FA LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE + : 00C5 0301 +01FB LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE + : 00E5 0301 +01FC LATIN CAPITAL LETTER AE WITH ACUTE (ash) * + : 00C6 0301 +01FD LATIN SMALL LETTER AE WITH ACUTE (ash) * + : 00E6 0301 +01FE LATIN CAPITAL LETTER O WITH STROKE AND ACUTE + : 00D8 0301 +01FF LATIN SMALL LETTER O WITH STROKE AND ACUTE + : 00F8 0301 +@ Additions for Slovenian and Croatian +0200 LATIN CAPITAL LETTER A WITH DOUBLE GRAVE + : 0041 030F +0201 LATIN SMALL LETTER A WITH DOUBLE GRAVE + : 0061 030F +0202 LATIN CAPITAL LETTER A WITH INVERTED BREVE + : 0041 0311 +0203 LATIN SMALL LETTER A WITH INVERTED BREVE + : 0061 0311 +0204 LATIN CAPITAL LETTER E WITH DOUBLE GRAVE + : 0045 030F +0205 LATIN SMALL LETTER E WITH DOUBLE GRAVE + : 0065 030F +0206 LATIN CAPITAL LETTER E WITH INVERTED BREVE + : 0045 0311 +0207 LATIN SMALL LETTER E WITH INVERTED BREVE + : 0065 0311 +0208 LATIN CAPITAL LETTER I WITH DOUBLE GRAVE + : 0049 030F +0209 LATIN SMALL LETTER I WITH DOUBLE GRAVE + : 0069 030F +020A LATIN CAPITAL LETTER I WITH INVERTED BREVE + : 0049 0311 +020B LATIN SMALL LETTER I WITH INVERTED BREVE + : 0069 0311 +020C LATIN CAPITAL LETTER O WITH DOUBLE GRAVE + : 004F 030F +020D LATIN SMALL LETTER O WITH DOUBLE GRAVE + : 006F 030F +020E LATIN CAPITAL LETTER O WITH INVERTED BREVE + : 004F 0311 +020F LATIN SMALL LETTER O WITH INVERTED BREVE + : 006F 0311 +0210 LATIN CAPITAL LETTER R WITH DOUBLE GRAVE + : 0052 030F +0211 LATIN SMALL LETTER R WITH DOUBLE GRAVE + : 0072 030F +0212 LATIN CAPITAL LETTER R WITH INVERTED BREVE + : 0052 0311 +0213 LATIN SMALL LETTER R WITH INVERTED BREVE + : 0072 0311 +0214 LATIN CAPITAL LETTER U WITH DOUBLE GRAVE + : 0055 030F +0215 LATIN SMALL LETTER U WITH DOUBLE GRAVE + : 0075 030F +0216 LATIN CAPITAL LETTER U WITH INVERTED BREVE + : 0055 0311 +0217 LATIN SMALL LETTER U WITH INVERTED BREVE + : 0075 0311 +@ Additions for Romanian +0218 LATIN CAPITAL LETTER S WITH COMMA BELOW * + : 0053 0326 +0219 LATIN SMALL LETTER S WITH COMMA BELOW * + * Romanian, when distinct comma below form is required + x (latin small letter s with cedilla - 015F) + : 0073 0326 +021A LATIN CAPITAL LETTER T WITH COMMA BELOW * + : 0054 0326 +021B LATIN SMALL LETTER T WITH COMMA BELOW * + * Romanian, when distinct comma below form is required + x (latin small letter t with cedilla - 0163) + : 0074 0326 +@ Miscellaneous additions +021C LATIN CAPITAL LETTER YOGH + x (latin capital letter ezh - 01B7) +021D LATIN SMALL LETTER YOGH + * Middle English, Scots + x (latin small letter ezh - 0292) + x (ounce sign - 2125) +021E LATIN CAPITAL LETTER H WITH CARON + : 0048 030C +021F LATIN SMALL LETTER H WITH CARON + * Finnish Romany + : 0068 030C +0222 LATIN CAPITAL LETTER OU +0223 LATIN SMALL LETTER OU + * Algonquin, Huron + x (digit eight - 0038) +0224 LATIN CAPITAL LETTER Z WITH HOOK +0225 LATIN SMALL LETTER Z WITH HOOK + * Middle High German +0226 LATIN CAPITAL LETTER A WITH DOT ABOVE + : 0041 0307 +0227 LATIN SMALL LETTER A WITH DOT ABOVE + * Uralicist usage + : 0061 0307 +0228 LATIN CAPITAL LETTER E WITH CEDILLA + : 0045 0327 +0229 LATIN SMALL LETTER E WITH CEDILLA + : 0065 0327 +@ Additions for Livonian +022A LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON + : 00D6 0304 +022B LATIN SMALL LETTER O WITH DIAERESIS AND MACRON + * Livonian + : 00F6 0304 +022C LATIN CAPITAL LETTER O WITH TILDE AND MACRON + : 00D5 0304 +022D LATIN SMALL LETTER O WITH TILDE AND MACRON + * Livonian + : 00F5 0304 +022E LATIN CAPITAL LETTER O WITH DOT ABOVE + : 004F 0307 +022F LATIN SMALL LETTER O WITH DOT ABOVE + * Livonian + : 006F 0307 +0230 LATIN CAPITAL LETTER O WITH DOT ABOVE AND MACRON + : 022E 0304 +0231 LATIN SMALL LETTER O WITH DOT ABOVE AND MACRON + * Livonian + : 022F 0304 +0232 LATIN CAPITAL LETTER Y WITH MACRON + : 0059 0304 +0233 LATIN SMALL LETTER Y WITH MACRON + * Livonian, Cornish + : 0079 0304 +@@ 0250 IPA Extensions 02AF +@ IPA extensions +@+ IPA includes basic Latin letters and a number of Latin letters from other blocks. + x (latin small letter ae - 00E6) + x (latin small letter c with cedilla - 00E7) + x (latin small letter eth - 00F0) + x (latin small letter o with stroke - 00F8) + x (latin small letter h with stroke - 0127) + x (latin small letter eng - 014B) + x (latin small ligature oe - 0153) + x (greek small letter beta - 03B2) + x (greek small letter theta - 03B8) + x (greek small letter lamda - 03BB) + x (greek small letter chi - 03C7) +0250 LATIN SMALL LETTER TURNED A + * low central unrounded vowel +0251 LATIN SMALL LETTER ALPHA + = LATIN SMALL LETTER SCRIPT A + * low back unrounded vowel + x (greek small letter alpha - 03B1) +0252 LATIN SMALL LETTER TURNED ALPHA + * low back rounded vowel +0253 LATIN SMALL LETTER B WITH HOOK + * implosive bilabial stop + * Pan-Nigerian alphabet + x (latin capital letter b with hook - 0181) +0254 LATIN SMALL LETTER OPEN O + * typographically a turned c + * lower-mid back rounded vowel + x (latin capital letter open o - 0186) +0255 LATIN SMALL LETTER C WITH CURL + * voiceless alveolo-palatal laminal fricative + * used in transcription of Mandarin Chinese + * sound spelled with 015B in Polish +0256 LATIN SMALL LETTER D WITH TAIL + = LATIN SMALL LETTER D RETROFLEX HOOK + * voiced retroflex stop + x (latin capital letter african d - 0189) +0257 LATIN SMALL LETTER D WITH HOOK + * implosive dental or alveolar stop + * Ewe, Pan-Nigerian alphabet + x (latin capital letter d with hook - 018A) +0258 LATIN SMALL LETTER REVERSED E + * upper-mid central unrounded vowel +0259 LATIN SMALL LETTER SCHWA + * mid-central unrounded vowel + * variant uppercase form 018E is associated with 01DD + x (latin capital letter schwa - 018F) + x (latin small letter turned e - 01DD) + x (cyrillic small letter schwa - 04D9) +025A LATIN SMALL LETTER SCHWA WITH HOOK + * rhotacized schwa +025B LATIN SMALL LETTER OPEN E + = LATIN SMALL LETTER EPSILON + * lower-mid front unrounded vowel + x (latin capital letter open e - 0190) + x (greek small letter epsilon - 03B5) +025C LATIN SMALL LETTER REVERSED OPEN E + * lower-mid central unrounded vowel +025D LATIN SMALL LETTER REVERSED OPEN E WITH HOOK + * rhotacized lower-mid central vowel +025E LATIN SMALL LETTER CLOSED REVERSED OPEN E + = LATIN SMALL LETTER CLOSED REVERSED EPSILON + * lower-mid central rounded vowel +025F LATIN SMALL LETTER DOTLESS J WITH STROKE + * voiced palatal stop + * typographically a turned f, but better thought of as a form of j + * "gy" in Hungarian orthography + * also archaic phonetic for palatoalveolar affricate 02A4 +0260 LATIN SMALL LETTER G WITH HOOK + * implosive velar stop + x (latin capital letter g with hook - 0193) +0261 LATIN SMALL LETTER SCRIPT G + * voiced velar stop + x (latin small letter g - 0067) +0262 LATIN LETTER SMALL CAPITAL G + * voiced uvular stop +0263 LATIN SMALL LETTER GAMMA + * voiced velar fricative + x (latin capital letter gamma - 0194) + x (greek small letter gamma - 03B3) +0264 LATIN SMALL LETTER RAMS HORN + = LATIN SMALL LETTER BABY GAMMA + * upper-mid back unrounded vowel +0265 LATIN SMALL LETTER TURNED H + * voiced rounded palatal approximant +0266 LATIN SMALL LETTER H WITH HOOK + * breathy-voiced glottal fricative + x (modifier letter small h with hook - 02B1) +0267 LATIN SMALL LETTER HENG WITH HOOK + * voiceless coarticulated velar and palatoalveolar fricative + * "tj" or "kj" or "sj" in some Swedish dialects +0268 LATIN SMALL LETTER I WITH STROKE + = barred i, i bar + * high central unrounded vowel + * ISO 6438 gives lowercase of 0197 as 026A, not 0268 +0269 LATIN SMALL LETTER IOTA + * semi-high front unrounded vowel +@+ * obsoleted by IPA in 1989 + * preferred use is 026A LATIN LETTER SMALL CAPITAL I + x (latin capital letter iota - 0196) + x (greek small letter iota - 03B9) +026A LATIN LETTER SMALL CAPITAL I + * semi-high front unrounded vowel + * preferred IPA alternate for 0269 + x (latin capital letter i with stroke - 0197) +026B LATIN SMALL LETTER L WITH MIDDLE TILDE + * velarized voiced alveolar lateral approximant +026C LATIN SMALL LETTER L WITH BELT + * voiceless alveolar lateral fricative +026D LATIN SMALL LETTER L WITH RETROFLEX HOOK + * voiced retroflex lateral +026E LATIN SMALL LETTER LEZH + * voiced lateral fricative + * "dhl" in Zulu orthography +026F LATIN SMALL LETTER TURNED M + * high back unrounded vowel + x (latin capital letter turned m - 019C) +0270 LATIN SMALL LETTER TURNED M WITH LONG LEG + * voiced velar approximant +0271 LATIN SMALL LETTER M WITH HOOK + * voiced labiodental nasal +0272 LATIN SMALL LETTER N WITH LEFT HOOK + * voiced palatal nasal + x (latin capital letter n with left hook - 019D) +0273 LATIN SMALL LETTER N WITH RETROFLEX HOOK + * voiced retroflex nasal +0274 LATIN LETTER SMALL CAPITAL N + * voiced uvular nasal +0275 LATIN SMALL LETTER BARRED O + = o bar + * rounded mid-central vowel, i.e. rounded schwa + * uppercase is 019F + x (greek small letter theta - 03B8) + x (cyrillic small letter fita - 0473) + x (cyrillic small letter barred o - 04E9) +0276 LATIN LETTER SMALL CAPITAL OE + * low front rounded vowel + x (latin small ligature oe - 0153) +0277 LATIN SMALL LETTER CLOSED OMEGA + * semi-high back rounded vowel +@+ * obsoleted by IPA in 1989 + * preferred use is 028A latin small letter upsilon +0278 LATIN SMALL LETTER PHI + * voiceless bilabial fricative + x (greek small letter phi - 03C6) +0279 LATIN SMALL LETTER TURNED R + * voiced alveolar approximant + x (modifier letter small turned r - 02B4) +027A LATIN SMALL LETTER TURNED R WITH LONG LEG + * voiced lateral flap +027B LATIN SMALL LETTER TURNED R WITH HOOK + * voiced retroflex approximant + x (modifier letter small turned r with hook - 02B5) +027C LATIN SMALL LETTER R WITH LONG LEG + * voiced strident apico-alveolar trill +@+ * obsoleted by IPA in 1989 + * sound spelled with 0159 in Czech + * preferred phonetic representation for Czech is 0072 031D + * in current use in Gaelic types (as glyph variant of 0072) +027D LATIN SMALL LETTER R WITH TAIL + * voiced retroflex flap +027E LATIN SMALL LETTER R WITH FISHHOOK + * voiced alveolar flap or tap +027F LATIN SMALL LETTER REVERSED R WITH FISHHOOK + * apical dental vowel + * used in Sinological tradition + * IPA spelling - 007A 0329 +0280 LATIN LETTER SMALL CAPITAL R * + * voiced uvular trill + * Germanic, Old Norse + * uppercase is 01A6 +0281 LATIN LETTER SMALL CAPITAL INVERTED R + * voiced uvular fricative or approximant + x (modifier letter small capital inverted r - 02B6) +0282 LATIN SMALL LETTER S WITH HOOK + * voiceless retroflex fricative +0283 LATIN SMALL LETTER ESH + * voiceless postalveolar fricative + x (latin capital letter esh - 01A9) + x (integral - 222B) +0284 LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK + * implosive palatal stop + * typographically based on 025F, not on 0283 +0285 LATIN SMALL LETTER SQUAT REVERSED ESH + * apical retroflex vowel + * used in Sinological tradition + * IPA spelling - 0290 0329 +0286 LATIN SMALL LETTER ESH WITH CURL + * palatalized voiceless postalveolar fricative + * suggested spelling - 0283 02B2 +0287 LATIN SMALL LETTER TURNED T + * dental click (sound of "tsk tsk") + x (latin letter dental click - 01C0) +0288 LATIN SMALL LETTER T WITH RETROFLEX HOOK + * voiceless retroflex stop + x (latin capital letter t with retroflex hook - 01AE) +0289 LATIN SMALL LETTER U BAR + * high central rounded vowel +028A LATIN SMALL LETTER UPSILON + * semi-high back rounded vowel + * preferred IPA alternate to 0277 + x (latin capital letter upsilon - 01B1) + x (greek small letter upsilon - 03C5) +028B LATIN SMALL LETTER V WITH HOOK + = LATIN SMALL LETTER SCRIPT V + * voiced labiodental approximant + x (latin capital letter v with hook - 01B2) + x (greek small letter upsilon - 03C5) +028C LATIN SMALL LETTER TURNED V + = caret, wedge + * lower-mid back unrounded vowel + x (greek capital letter lamda - 039B) + x (caret - 2038) + x (logical and - 2227) +028D LATIN SMALL LETTER TURNED W + * voiceless rounded labiovelar approximant +028E LATIN SMALL LETTER TURNED Y + * voiced lateral approximant +028F LATIN LETTER SMALL CAPITAL Y + * semi-high front rounded vowel +0290 LATIN SMALL LETTER Z WITH RETROFLEX HOOK + * voiced retroflex fricative +0291 LATIN SMALL LETTER Z WITH CURL + * voiced alveolo-palatal laminal fricative + * sound spelled with 017A in Polish +0292 LATIN SMALL LETTER EZH + = LATIN SMALL LETTER YOGH + = dram + * voiced postalveolar fricative + * uppercase is 01B7 + * Skolt Sámi + x (latin small letter yogh - 021D) + x (cyrillic small letter abkhasian dze - 04E1) + x (ounce sign - 2125) +0293 LATIN SMALL LETTER EZH WITH CURL + * palatalized voiced postalveolar fricative +0294 LATIN LETTER GLOTTAL STOP + x (modifier letter glottal stop - 02C0) +0295 LATIN LETTER PHARYNGEAL VOICED FRICATIVE + = LATIN LETTER REVERSED GLOTTAL STOP + * voiced pharyngeal fricative + * ain + x (latin small letter ezh reversed - 01B9) + x (modifier letter reversed glottal stop - 02C1) +0296 LATIN LETTER INVERTED GLOTTAL STOP + * lateral click + x (latin letter lateral click - 01C1) +0297 LATIN LETTER STRETCHED C + * palatal (or alveolar) click + x (latin letter retroflex click - 01C3) + x (complement - 2201) +0298 LATIN LETTER BILABIAL CLICK + = LATIN LETTER BULLSEYE + x (circled dot operator - 2299) +0299 LATIN LETTER SMALL CAPITAL B + * bilabial trill +029A LATIN SMALL LETTER CLOSED OPEN E + = LATIN SMALL LETTER CLOSED EPSILON + * lower-mid front rounded vowel + * non-IPA alternate for the preferred 0153 +029B LATIN LETTER SMALL CAPITAL G WITH HOOK + * voiced uvular implosive +029C LATIN LETTER SMALL CAPITAL H + * voiceless epiglottal fricative +029D LATIN SMALL LETTER J WITH CROSSED-TAIL + * voiced palatal fricative +029E LATIN SMALL LETTER TURNED K + * proposed for velar click +@+ * withdrawn by IPA in 1970 +029F LATIN LETTER SMALL CAPITAL L + * velar lateral approximant +02A0 LATIN SMALL LETTER Q WITH HOOK + * voiceless uvular implosive +02A1 LATIN LETTER GLOTTAL STOP WITH STROKE + * voiced epiglottal stop +02A2 LATIN LETTER REVERSED GLOTTAL STOP WITH STROKE + * voiced epiglottal fricative +02A3 LATIN SMALL LETTER DZ DIGRAPH + * voiced dental affricate +02A4 LATIN SMALL LETTER DEZH DIGRAPH + * voiced postalveolar affricate +02A5 LATIN SMALL LETTER DZ DIGRAPH WITH CURL + * voiced alveolo-palatal affricate +02A6 LATIN SMALL LETTER TS DIGRAPH + * voiceless dental affricate +02A7 LATIN SMALL LETTER TESH DIGRAPH + * voiceless postalveolar affricate +02A8 LATIN SMALL LETTER TC DIGRAPH WITH CURL + * voiceless alveolo-palatal affricate +@ IPA characters for disordered speech +02A9 LATIN SMALL LETTER FENG DIGRAPH + * velopharyngeal fricative +02AA LATIN SMALL LETTER LS DIGRAPH + * lateral alveolar fricative (lisp) +02AB LATIN SMALL LETTER LZ DIGRAPH + * voiced lateral alveolar fricative +02AC LATIN LETTER BILABIAL PERCUSSIVE + * audible lip smack +02AD LATIN LETTER BIDENTAL PERCUSSIVE + * audible teeth gnashing +@@ 02B0 Spacing Modifier Letters 02FF +@ Phonetic modifiers derived from Latin letters +02B0 MODIFIER LETTER SMALL H + * aspiration + # 0068 +02B1 MODIFIER LETTER SMALL H WITH HOOK + * breathy voiced, murmured + x (latin small letter h with hook - 0266) + x (combining diaeresis below - 0324) + # 0266 +02B2 MODIFIER LETTER SMALL J + * palatalization + x (combining palatalized hook below - 0321) + # 006A +02B3 MODIFIER LETTER SMALL R + # 0072 +02B4 MODIFIER LETTER SMALL TURNED R + x (latin small letter turned r - 0279) + # 0279 +02B5 MODIFIER LETTER SMALL TURNED R WITH HOOK + x (latin small letter turned r with hook - 027B) + # 027B +02B6 MODIFIER LETTER SMALL CAPITAL INVERTED R + * preceding four used for r-coloring or r-offglides + x (latin letter small capital inverted r - 0281) + # 0281 +02B7 MODIFIER LETTER SMALL W + * labialization + x (combining inverted double arch below - 032B) + # 0077 +02B8 MODIFIER LETTER SMALL Y + * palatalization + * common Americanist substitution for 02B2 + # 0079 +@ Miscellaneous phonetic modifiers +02B9 MODIFIER LETTER PRIME + * primary stress, emphasis + * transliteration of mjagkij znak (Cyrillic soft sign: palatalization) + x (apostrophe - 0027) + x (acute accent - 00B4) + x (modifier letter acute accent - 02CA) + x (combining acute accent - 0301) + x (greek numeral sign - 0374) + x (prime - 2032) +02BA MODIFIER LETTER DOUBLE PRIME + * exaggerated stress, contrastive stress + * transliteration of tverdyj znak (Cyrillic hard sign: no palatalization) + x (quotation mark - 0022) + x (combining double acute accent - 030B) + x (double prime - 2033) +02BB MODIFIER LETTER TURNED COMMA + * typographical alternate for 02BD or 02BF + x (combining turned comma above - 0312) + x (left single quotation mark - 2018) +02BC MODIFIER LETTER APOSTROPHE + = apostrophe + * glottal stop, glottalization, ejective + * spacing clone of Greek smooth breathing mark + * many languages use this as a letter of their alphabets + x (apostrophe - 0027) + x (combining comma above - 0313) + x (combining comma above right - 0315) + x (armenian apostrophe - 055A) + x (right single quotation mark - 2019) +02BD MODIFIER LETTER REVERSED COMMA + * weak aspiration + * spacing clone of Greek rough breathing mark + x (combining reversed comma above - 0314) + x (armenian modifier letter left half ring - 0559) + x (single high-reversed-9 quotation mark - 201B) +02BE MODIFIER LETTER RIGHT HALF RING + * transliteration of Arabic hamza (glottal stop) + x (armenian apostrophe - 055A) + x (arabic letter hamza - 0621) +02BF MODIFIER LETTER LEFT HALF RING + * transliteration of Arabic ain (voiced pharyngeal fricative) + x (armenian modifier letter left half ring - 0559) + x (arabic letter ain - 0639) +02C0 MODIFIER LETTER GLOTTAL STOP + * ejective or glottalized + * typographical alternate for 02BC or 02BE + x (latin letter glottal stop - 0294) + x (combining hook above - 0309) +02C1 MODIFIER LETTER REVERSED GLOTTAL STOP + * typographical alternate for 02BF + x (latin letter pharyngeal voiced fricative - 0295) +02C2 MODIFIER LETTER LEFT ARROWHEAD + * fronted articulation +02C3 MODIFIER LETTER RIGHT ARROWHEAD + * backed articulation +02C4 MODIFIER LETTER UP ARROWHEAD + * raised articulation + x (circumflex accent - 005E) + x (up arrowhead - 2303) +02C5 MODIFIER LETTER DOWN ARROWHEAD + * lowered articulation +02C6 MODIFIER LETTER CIRCUMFLEX ACCENT + * rising-falling tone, falling tone, secondary stress, etc. + x (circumflex accent - 005E) + x (combining circumflex accent - 0302) +02C7 CARON (Mandarin Chinese third tone) + = hacek + * falling-rising tone + * Mandarin Chinese third tone + x (combining caron - 030C) +02C8 MODIFIER LETTER VERTICAL LINE + * primary stress, downstep + * precedes letter or syllable modified + x (apostrophe - 0027) + x (combining vertical line above - 030D) +02C9 MODIFIER LETTER MACRON (Mandarin Chinese first tone) + * high level tone + * precedes or follows letter or syllable modified + * Mandarin Chinese first tone + x (macron - 00AF) + x (combining macron - 0304) +02CA MODIFIER LETTER ACUTE ACCENT (Mandarin Chinese second tone) + * high-rising tone (IPA), high tone, primary stress + * Mandarin Chinese second tone + x (acute accent - 00B4) + x (modifier letter prime - 02B9) + x (combining acute accent - 0301) + x (greek numeral sign - 0374) + x (armenian emphasis mark - 055B) +02CB MODIFIER LETTER GRAVE ACCENT (Mandarin Chinese fourth tone) + * high-falling tone (IPA), low tone, secondary or tertiary stress + * Mandarin Chinese fourth tone + x (grave accent - 0060) + x (combining grave accent - 0300) + x (armenian comma - 055D) +02CC MODIFIER LETTER LOW VERTICAL LINE + * secondary stress + * precedes letter or syllable modified + x (combining vertical line below - 0329) +02CD MODIFIER LETTER LOW MACRON + * low level tone + x (low line - 005F) + x (combining macron below - 0331) +02CE MODIFIER LETTER LOW GRAVE ACCENT + * low-falling tone +02CF MODIFIER LETTER LOW ACUTE ACCENT + * low-rising tone + x (greek lower numeral sign - 0375) +02D0 MODIFIER LETTER TRIANGULAR COLON + * length mark + x (colon - 003A) +02D1 MODIFIER LETTER HALF TRIANGULAR COLON + * half-length mark + x (middle dot - 00B7) +02D2 MODIFIER LETTER CENTRED RIGHT HALF RING + * more rounded articulation +02D3 MODIFIER LETTER CENTRED LEFT HALF RING + * less rounded articulation +02D4 MODIFIER LETTER UP TACK + * vowel raising or closing + x (combining up tack below - 031D) + x (combining dot below - 0323) +02D5 MODIFIER LETTER DOWN TACK + * vowel lowering or opening + x (combining left half ring below - 031C) + x (combining down tack below - 031E) +02D6 MODIFIER LETTER PLUS SIGN + * advanced or fronted articulation + x (combining plus sign below - 031F) +02D7 MODIFIER LETTER MINUS SIGN + * retracted or backed articulation + * glyph may have small end-serifs + x (combining minus sign below - 0320) +@ Spacing clones of diacritics +02D8 BREVE + x (combining breve - 0306) + # 0020 0306 +02D9 DOT ABOVE (Mandarin Chinese light tone) + * Mandarin Chinese fifth tone (light or neutral) + x (combining dot above - 0307) + # 0020 0307 +02DA RING ABOVE + x (degree sign - 00B0) + x (combining ring above - 030A) + # 0020 030A +02DB OGONEK + x (combining ogonek - 0328) + # 0020 0328 +02DC SMALL TILDE + x (tilde - 007E) + x (combining tilde - 0303) + x (tilde operator - 223C) + # 0020 0303 +02DD DOUBLE ACUTE ACCENT + x (combining double acute accent - 030B) + # 0020 030B +@ Additions based on 1989 IPA +02DE MODIFIER LETTER RHOTIC HOOK + * rhotacization in vowel + * often ligated: 025A = 0259 + 02DE; 025D = 025C + 02DE +02DF MODIFIER LETTER CROSS ACCENT + * Swedish grave accent +02E0 MODIFIER LETTER SMALL GAMMA + * these modifier letters are occasionally used in transcription of affricates + # 0263 +02E1 MODIFIER LETTER SMALL L + # 006C +02E2 MODIFIER LETTER SMALL S + # 0073 +02E3 MODIFIER LETTER SMALL X + # 0078 +02E4 MODIFIER LETTER SMALL REVERSED GLOTTAL STOP + # 0295 +@ Tone letters +02E5 MODIFIER LETTER EXTRA-HIGH TONE BAR +02E6 MODIFIER LETTER HIGH TONE BAR +02E7 MODIFIER LETTER MID TONE BAR +02E8 MODIFIER LETTER LOW TONE BAR +02E9 MODIFIER LETTER EXTRA-LOW TONE BAR +02EA MODIFIER LETTER YIN DEPARTING TONE MARK +02EB MODIFIER LETTER YANG DEPARTING TONE MARK +@ IPA modifiers +02EC MODIFIER LETTER VOICING +02ED MODIFIER LETTER UNASPIRATED +@ Other modifier letters +02EE MODIFIER LETTER DOUBLE APOSTROPHE + +2000 EN QUAD + : 2002 en space +2001 EM QUAD + = mutton quad + : 2003 em space +2002 EN SPACE + = nut + * half an em + # 0020 space +2003 EM SPACE + = mutton + * nominally, a space equal to the type size in points + * may scale by the condensation factor of a font + # 0020 space +2004 THREE-PER-EM SPACE + = thick space + # 0020 space +2005 FOUR-PER-EM SPACE + = mid space + # 0020 space +2006 SIX-PER-EM SPACE + * in computer typography sometimes equated to thin space + # 0020 space +2007 FIGURE SPACE + * space equal to tabular width of a font + * this is equivalent to the digit width of fonts with fixed-width digits + # 0020 +2008 PUNCTUATION SPACE + * space equal to narrow punctuation of a font + # 0020 space +2009 THIN SPACE + * a fifth of an em (or sometimes a sixth) + # 0020 space +200A HAIR SPACE + * thinner than a thin space + * in traditional typography, the thinnest space available + # 0020 space +200B ZERO WIDTH SPACE + * nominally zero width, but may expand in justification +@ Formatting characters +200C ZERO WIDTH NON-JOINER + = ZWNJ +200D ZERO WIDTH JOINER + = ZWJ +200E LEFT-TO-RIGHT MARK + = LRM +200F RIGHT-TO-LEFT MARK + = RLM +@ Dashes +2010 HYPHEN + x (hyphen-minus - 002D) +2011 NON-BREAKING HYPHEN + x (hyphen-minus - 002D) + # 2010 +2012 FIGURE DASH +2013 EN DASH +2014 EM DASH + * may be used in pairs to offset parenthetical text + x (katakana-hiragana prolonged sound mark - 30FC) +2015 HORIZONTAL BAR + = QUOTATION DASH + * long dash introducing quoted text +@ General punctuation +2016 DOUBLE VERTICAL LINE + * used in pairs to indicate norm of a matrix + x (parallel to - 2225) +2017 DOUBLE LOW LINE + * this is a spacing character + x (low line - 005F) + x (combining double low line - 0333) + # 0020 0333 +2018 LEFT SINGLE QUOTATION MARK + = SINGLE TURNED COMMA QUOTATION MARK + * this is the preferred glyph (as opposed to 201B) + x (apostrophe - 0027) + x (modifier letter turned comma - 02BB) + x (heavy single turned comma quotation mark ornament - 275B) +2019 RIGHT SINGLE QUOTATION MARK + = SINGLE COMMA QUOTATION MARK + * this is the preferred character to use for apostrophe + x (apostrophe - 0027) + x (modifier letter apostrophe - 02BC) + x (heavy single comma quotation mark ornament - 275C) +201A SINGLE LOW-9 QUOTATION MARK + = LOW SINGLE COMMA QUOTATION MARK + * used as opening single quotation mark in some languages +201B SINGLE HIGH-REVERSED-9 QUOTATION MARK + = SINGLE REVERSED COMMA QUOTATION MARK + * glyph variant of 2018 + x (modifier letter reversed comma - 02BD) +201C LEFT DOUBLE QUOTATION MARK + = DOUBLE TURNED COMMA QUOTATION MARK + * this is the preferred glyph (as opposed to 201F) + x (quotation mark - 0022) + x (heavy double turned comma quotation mark ornament - 275D) + x (reversed double prime quotation mark - 301D) +201D RIGHT DOUBLE QUOTATION MARK + = DOUBLE COMMA QUOTATION MARK + x (quotation mark - 0022) + x (double prime - 2033) + x (heavy double comma quotation mark ornament - 275E) + x (double prime quotation mark - 301E) +201E DOUBLE LOW-9 QUOTATION MARK + = LOW DOUBLE COMMA QUOTATION MARK + * used as opening double quotation mark in some languages + x (low double prime quotation mark - 301F) +201F DOUBLE HIGH-REVERSED-9 QUOTATION MARK + = DOUBLE REVERSED COMMA QUOTATION MARK + * glyph variant of 201C +2020 DAGGER + = obelisk, obelus, long cross +2021 DOUBLE DAGGER + = diesis, double obelisk +2022 BULLET + = black small circle + x (middle dot - 00B7) + x (one dot leader - 2024) + x (bullet operator - 2219) + x (inverse bullet - 25D8) + x (white bullet - 25E6) +2023 TRIANGULAR BULLET + x (end of proof - 220E) + x (black right-pointing small triangle - 25B8) +2024 ONE DOT LEADER + x (middle dot - 00B7) + x (bullet - 2022) + x (bullet operator - 2219) + # 002E full stop +2025 TWO DOT LEADER + # 002E 002E +2026 HORIZONTAL ELLIPSIS + = three dot leader + x (vertical ellipsis - 22EE) + # 002E 002E 002E +2027 HYPHENATION POINT +@ Formatting characters +2028 LINE SEPARATOR + * may be used to represent this semantic unambiguously +2029 PARAGRAPH SEPARATOR + * may be used to represent this semantic unambiguously +202A LEFT-TO-RIGHT EMBEDDING + = LRE +202B RIGHT-TO-LEFT EMBEDDING + = RLE +202C POP DIRECTIONAL FORMATTING + = PDF +202D LEFT-TO-RIGHT OVERRIDE + = LRO +202E RIGHT-TO-LEFT OVERRIDE + = RLO +202F NARROW NO-BREAK SPACE + x (no-break space - 00A0) + # 0020 +@ General punctuation +2030 PER MILLE SIGN + x (percent sign - 0025) +2031 PER TEN THOUSAND SIGN + x (percent sign - 0025) +2032 PRIME + = minutes, feet + x (apostrophe - 0027) + x (acute accent - 00B4) + x (modifier letter prime - 02B9) +2033 DOUBLE PRIME + = seconds, inches + x (quotation mark - 0022) + x (modifier letter double prime - 02BA) + x (right double quotation mark - 201D) + x (ditto mark - 3003) + x (double prime quotation mark - 301E) + # 2032 2032 +2034 TRIPLE PRIME + # 2032 2032 2032 +2035 REVERSED PRIME + x (grave accent - 0060) +2036 REVERSED DOUBLE PRIME + x (reversed double prime quotation mark - 301D) + # 2035 2035 +2037 REVERSED TRIPLE PRIME + # 2035 2035 2035 +2038 CARET + x (up arrowhead - 2303) +2039 SINGLE LEFT-POINTING ANGLE QUOTATION MARK + = LEFT POINTING SINGLE GUILLEMET + * usually opening, sometimes closing + x (less-than sign - 003C) + x (left-pointing angle bracket - 2329) + x (left angle bracket - 3008) +203A SINGLE RIGHT-POINTING ANGLE QUOTATION MARK + = RIGHT POINTING SINGLE GUILLEMET + * usually closing, sometimes opening + x (greater-than sign - 003E) + x (right-pointing angle bracket - 232A) + x (right angle bracket - 3009) +203B REFERENCE MARK + = Japanese kome + = Urdu paragraph separator + x (tibetan ku ru kha bzhi mig can - 0FBF) +203C DOUBLE EXCLAMATION MARK + x (exclamation mark - 0021) + # 0021 0021 +203D INTERROBANG + x (exclamation mark - 0021) + x (question mark - 003F) +203E OVERLINE + = SPACING OVERSCORE + # 0020 0305 +203F UNDERTIE (Enotikon) + = Greek enotikon + x (smile - 2323) +2040 CHARACTER TIE + x (frown - 2322) +2041 CARET INSERTION POINT + * proofreader's mark: insert here + x (right semidirect product - 22CC) +2042 ASTERISM +2043 HYPHEN BULLET +2044 FRACTION SLASH + = solidus (in typography) + * for composing arbitrary fractions + x (solidus - 002F) + x (division slash - 2215) +2045 LEFT SQUARE BRACKET WITH QUILL +2046 RIGHT SQUARE BRACKET WITH QUILL +2048 QUESTION EXCLAMATION MARK + * designed for use in vertical text + # 003F 0021 +2049 EXCLAMATION QUESTION MARK + * designed for use in vertical text + # 0021 003F +204A TIRONIAN SIGN ET + * Irish Gaelic, ... +204B REVERSED PILCROW SIGN + x (pilcrow sign - 00B6) +204C BLACK LEFTWARDS BULLET +204D BLACK RIGHTWARDS BULLET +@ Deprecated +206A INHIBIT SYMMETRIC SWAPPING +206B ACTIVATE SYMMETRIC SWAPPING +206C INHIBIT ARABIC FORM SHAPING +206D ACTIVATE ARABIC FORM SHAPING +206E NATIONAL DIGIT SHAPES +206F NOMINAL DIGIT SHAPES +@@ 2070 Superscripts and Subscripts 209F +@ Superscripts +2070 SUPERSCRIPT ZERO + # 0030 +2071 + x (superscript one - 00B9) +2072 + x (superscript two - 00B2) +2073 + x (superscript three - 00B3) +2074 SUPERSCRIPT FOUR + # 0034 +2075 SUPERSCRIPT FIVE + # 0035 +2076 SUPERSCRIPT SIX + # 0036 +2077 SUPERSCRIPT SEVEN + # 0037 +2078 SUPERSCRIPT EIGHT + # 0038 +2079 SUPERSCRIPT NINE + # 0039 +207A SUPERSCRIPT PLUS SIGN + # 002B +207B SUPERSCRIPT MINUS + # 2212 +207C SUPERSCRIPT EQUALS SIGN + # 003D +207D SUPERSCRIPT LEFT PARENTHESIS + # 0028 +207E SUPERSCRIPT RIGHT PARENTHESIS + # 0029 +207F SUPERSCRIPT LATIN SMALL LETTER N + # 006E +@ Subscripts +2080 SUBSCRIPT ZERO + # 0030 +2081 SUBSCRIPT ONE + # 0031 +2082 SUBSCRIPT TWO + # 0032 +2083 SUBSCRIPT THREE + # 0033 +2084 SUBSCRIPT FOUR + # 0034 +2085 SUBSCRIPT FIVE + # 0035 +2086 SUBSCRIPT SIX + # 0036 +2087 SUBSCRIPT SEVEN + # 0037 +2088 SUBSCRIPT EIGHT + # 0038 +2089 SUBSCRIPT NINE + # 0039 +208A SUBSCRIPT PLUS SIGN + # 002B +208B SUBSCRIPT MINUS + # 2212 +208C SUBSCRIPT EQUALS SIGN + # 003D +208D SUBSCRIPT LEFT PARENTHESIS + # 0028 +208E SUBSCRIPT RIGHT PARENTHESIS + # 0029 +@@ 20A0 Currency Symbols 20CF +@ Currency symbols +@+ A number of currency symbols are found in other blocks. + x (dollar sign - 0024) + x (cent sign - 00A2) + x (pound sign - 00A3) + x (currency sign - 00A4) + x (yen sign - 00A5) + x (bengali rupee mark - 09F2) + x (bengali rupee sign - 09F3) + x (thai currency symbol baht - 0E3F) + x (khmer currency symbol riel - 17DB) +20A0 EURO-CURRENCY SIGN + * intended for ECU, but not widely used + * historical character, this is NOT the euro! + x (euro sign - 20AC) +20A1 COLON SIGN + * Costa Rica, El Salvador +20A2 CRUZEIRO SIGN + * Brazil +20A3 FRENCH FRANC SIGN + * France +20A4 LIRA SIGN + * Italy, Turkey + x (pound sign - 00A3) +20A5 MILL SIGN + * USA (1/10 cent) +20A6 NAIRA SIGN + * Nigeria +20A7 PESETA SIGN + * Spain +20A8 RUPEE SIGN + * India + # 0052 0073 +20A9 WON SIGN + * Korea +20AA NEW SHEQEL SIGN + * Israel +20AB DONG SIGN + * Vietnam +20AC EURO SIGN + * currency sign for the European Monetary Union + * euro, not ECU + x (euro-currency sign - 20A0) +20AD KIP SIGN + * Laos +20AE TUGRIK SIGN + * Mongolia + * also transliterated as tugrug, tugric, tugrog, togrog +20AF DRACHMA SIGN + * Greece +@@ 20D0 Combining Diacritical Marks for Symbols 20FF +@ Combining diacritical marks for symbols +20D0 COMBINING LEFT HARPOON ABOVE +20D1 COMBINING RIGHT HARPOON ABOVE + * vector +20D2 COMBINING LONG VERTICAL LINE OVERLAY +20D3 COMBINING SHORT VERTICAL LINE OVERLAY + * negation +20D4 COMBINING ANTICLOCKWISE ARROW ABOVE +20D5 COMBINING CLOCKWISE ARROW ABOVE + * rotation +20D6 COMBINING LEFT ARROW ABOVE +20D7 COMBINING RIGHT ARROW ABOVE + * vector +20D8 COMBINING RING OVERLAY +20D9 COMBINING CLOCKWISE RING OVERLAY +20DA COMBINING ANTICLOCKWISE RING OVERLAY +20DB COMBINING THREE DOTS ABOVE + = third derivative +20DC COMBINING FOUR DOTS ABOVE + = fourth derivative +@ Enclosing diacritics +20DD COMBINING ENCLOSING CIRCLE + = JIS composition circle + x (white circle - 25CB) + x (large circle - 25EF) + x (ideographic number zero - 3007) +20DE COMBINING ENCLOSING SQUARE + x (white square - 25A1) +20DF COMBINING ENCLOSING DIAMOND + x (white diamond - 25C7) +20E0 COMBINING ENCLOSING CIRCLE BACKSLASH + * prohibition +@ Additional diacritical mark for symbols +20E1 COMBINING LEFT RIGHT ARROW ABOVE + * tensor +@ Additional enclosing diacritics +20E2 COMBINING ENCLOSING SCREEN + x (clear screen symbol - 239A) +20E3 COMBINING ENCLOSING KEYCAP + +*/ +