# SuperScriptFolding.txt # DRAFT 1 - 2004-05-22 Asmus Freytag # Subject to change # # Base version of Unicode: 4.0.0 # # # Datafile for Unicode Technical Report #30 # Copyright (c) 1991-2004 Unicode, Inc. # For terms of use, and documentation see # http://www.unicode.org/reports/tr30/ # ================================= # # Map all characters that are superscripted forms to their equivalent letter # # Format # Field 0 - character code (source) # Field 1 - character code or code sequence (target) # Comment - descriptive name of the source character # # Notes: # # 1) This is a superset of characters with the compatibility # decomposition # # Stability # The repertoire of modifier letters is not yet complete, therefore # this file would need to change whenever additional modifier # letters are added to the Unicode Standard. # ########################################################################### # characters with compatibility decomposition in UnicodeData.txt 00AA;a # ª → a FEMININE ORDINAL INDICATOR → a 00B2;2 # ² → 2 SUPERSCRIPT TWO → 2 00B3;3 # ³ → 3 SUPERSCRIPT THREE → 3 00B9;1 # ¹ → 1 SUPERSCRIPT ONE → 1 00BA;o # º → o MASCULINE ORDINAL INDICATOR → o 02B0;h # ʰ → h MODIFIER LETTER SMALL H → h 02B1; 0266 # ʱ → ɦ MODIFIER LETTER SMALL H WITH HOOK → LATIN SMALL LETTER H WITH HOOK 02B2;j # ʲ → j MODIFIER LETTER SMALL J → j 02B3;r # ʳ → r MODIFIER LETTER SMALL R → r 02B4; 0279 # ʴ → ɹ MODIFIER LETTER SMALL TURNED R → LATIN SMALL LETTER TURNED R 02B5; 027B # ʵ → ɻ MODIFIER LETTER SMALL TURNED R WITH HOOK → LATIN SMALL LETTER TURNED R WITH HOOK 02B6; 0281 # ʶ → ʁ MODIFIER LETTER SMALL CAPITAL INVERTED R → LATIN LETTER SMALL CAPITAL INVERTED R 02B7;w # ʷ → w MODIFIER LETTER SMALL W → w 02B8;y # ʸ → y MODIFIER LETTER SMALL Y → y 02E0; 0263 # ˠ → ɣ MODIFIER LETTER SMALL GAMMA → LATIN SMALL LETTER GAMMA 02E1;l # ˡ → l MODIFIER LETTER SMALL L → l 02E2;s # ˢ → s MODIFIER LETTER SMALL S → s 02E3;x # ˣ → x MODIFIER LETTER SMALL X → x 02E4; 0295 # ˤ → ʕ MODIFIER LETTER 
SMALL REVERSED GLOTTAL STOP → LATIN LETTER PHARYNGEAL VOICED FRICATIVE 1D2C;A # ᴬ → A MODIFIER LETTER CAPITAL A → A 1D2D; 00C6 # ᴭ → Æ MODIFIER LETTER CAPITAL AE → LATIN CAPITAL LETTER AE 1D2E;B # ᴮ → B MODIFIER LETTER CAPITAL B → B 1D30;D # ᴰ → D MODIFIER LETTER CAPITAL D → D 1D31;E # ᴱ → E MODIFIER LETTER CAPITAL E → E 1D32; 018E # ᴲ → Ǝ MODIFIER LETTER CAPITAL REVERSED E → LATIN CAPITAL LETTER REVERSED E 1D33;G # ᴳ → G MODIFIER LETTER CAPITAL G → G 1D34;H # ᴴ → H MODIFIER LETTER CAPITAL H → H 1D35;I # ᴵ → I MODIFIER LETTER CAPITAL I → I 1D36;J # ᴶ → J MODIFIER LETTER CAPITAL J → J 1D37;K # ᴷ → K MODIFIER LETTER CAPITAL K → K 1D38;L # ᴸ → L MODIFIER LETTER CAPITAL L → L 1D39;M # ᴹ → M MODIFIER LETTER CAPITAL M → M 1D3A;N # ᴺ → N MODIFIER LETTER CAPITAL N → N 1D3C;O # ᴼ → O MODIFIER LETTER CAPITAL O → O 1D3D; 0222 # ᴽ → Ȣ MODIFIER LETTER CAPITAL OU → LATIN CAPITAL LETTER OU 1D3E;P # ᴾ → P MODIFIER LETTER CAPITAL P → P 1D3F;R # ᴿ → R MODIFIER LETTER CAPITAL R → R 1D40;T # ᵀ → T MODIFIER LETTER CAPITAL T → T 1D41;U # ᵁ → U MODIFIER LETTER CAPITAL U → U 1D42;W # ᵂ → W MODIFIER LETTER CAPITAL W → W 1D43;a # ᵃ → a MODIFIER LETTER SMALL A → a 1D44; 0250 # ᵄ → ɐ MODIFIER LETTER SMALL TURNED A → LATIN SMALL LETTER TURNED A 1D45; 0251 # ᵅ → ɑ MODIFIER LETTER SMALL ALPHA → LATIN SMALL LETTER ALPHA 1D46; 1D02 # ᵆ → ᴂ MODIFIER LETTER SMALL TURNED AE → LATIN SMALL LETTER TURNED AE 1D47;b # ᵇ → b MODIFIER LETTER SMALL B → b 1D48;d # ᵈ → d MODIFIER LETTER SMALL D → d 1D49;e # ᵉ → e MODIFIER LETTER SMALL E → e 1D4A; 0259 # ᵊ → ə MODIFIER LETTER SMALL SCHWA → LATIN SMALL LETTER SCHWA 1D4B; 025B # ᵋ → ɛ MODIFIER LETTER SMALL OPEN E → LATIN SMALL LETTER OPEN E 1D4C; 025C # ᵌ → ɜ MODIFIER LETTER SMALL TURNED OPEN E → LATIN SMALL LETTER REVERSED OPEN E 1D4D;g # ᵍ → g MODIFIER LETTER SMALL G → g 1D4F;k # ᵏ → k MODIFIER LETTER SMALL K → k 1D50;m # ᵐ → m MODIFIER LETTER SMALL M → m 1D51; 014B # ᵑ → ŋ MODIFIER LETTER SMALL ENG → LATIN SMALL LETTER ENG 1D52;o # ᵒ → o MODIFIER LETTER SMALL 
O → o 1D53; 0254 # ᵓ → ɔ MODIFIER LETTER SMALL OPEN O → LATIN SMALL LETTER OPEN O 1D54; 1D16 # ᵔ → ᴖ MODIFIER LETTER SMALL TOP HALF O → LATIN SMALL LETTER TOP HALF O 1D55; 1D17 # ᵕ → ᴗ MODIFIER LETTER SMALL BOTTOM HALF O → LATIN SMALL LETTER BOTTOM HALF O 1D56;p # ᵖ → p MODIFIER LETTER SMALL P → p 1D57;t # ᵗ → t MODIFIER LETTER SMALL T → t 1D58;u # ᵘ → u MODIFIER LETTER SMALL U → u 1D59; 1D1D # ᵙ → ᴝ MODIFIER LETTER SMALL SIDEWAYS U → LATIN SMALL LETTER SIDEWAYS U 1D5A; 026F # ᵚ → ɯ MODIFIER LETTER SMALL TURNED M → LATIN SMALL LETTER TURNED M 1D5B;v # ᵛ → v MODIFIER LETTER SMALL V → v 1D5C; 1D25 # ᵜ → ᴥ MODIFIER LETTER SMALL AIN → LATIN LETTER AIN 1D5D; 03B2 # ᵝ → β MODIFIER LETTER SMALL BETA → GREEK SMALL LETTER BETA 1D5E; 03B3 # ᵞ → γ MODIFIER LETTER SMALL GREEK GAMMA → GREEK SMALL LETTER GAMMA 1D5F; 03B4 # ᵟ → δ MODIFIER LETTER SMALL DELTA → GREEK SMALL LETTER DELTA 1D60; 03C6 # ᵠ → φ MODIFIER LETTER SMALL GREEK PHI → GREEK SMALL LETTER PHI 1D61; 03C7 # ᵡ → χ MODIFIER LETTER SMALL CHI → GREEK SMALL LETTER CHI 2070;0 # ⁰ → 0 SUPERSCRIPT ZERO → 0 2071;i # ⁱ → i SUPERSCRIPT LATIN SMALL LETTER I → i 2074;4 # ⁴ → 4 SUPERSCRIPT FOUR → 4 2075;5 # ⁵ → 5 SUPERSCRIPT FIVE → 5 2076;6 # ⁶ → 6 SUPERSCRIPT SIX → 6 2077;7 # ⁷ → 7 SUPERSCRIPT SEVEN → 7 2078;8 # ⁸ → 8 SUPERSCRIPT EIGHT → 8 2079;9 # ⁹ → 9 SUPERSCRIPT NINE → 9 207A;+ # ⁺ → + SUPERSCRIPT PLUS SIGN → + 207B; 2212 # ⁻ → − SUPERSCRIPT MINUS → MINUS SIGN 207C;= # ⁼ → = SUPERSCRIPT EQUALS SIGN → = 207D;( # ⁽ → ( SUPERSCRIPT LEFT PARENTHESIS → ( 207E;) # ⁾ → ) SUPERSCRIPT RIGHT PARENTHESIS → ) 207F;n # ⁿ → n SUPERSCRIPT LATIN SMALL LETTER N → n 2120;SM # ℠ → SM SERVICE MARK → SM 2122;TM # ™ → TM TRADE MARK SIGN → TM 3192; 4E00 # ㆒ → 一 IDEOGRAPHIC ANNOTATION ONE MARK → CJK UNIFIED IDEOGRAPH-4E00 3193; 4E8C # ㆓ → 二 IDEOGRAPHIC ANNOTATION TWO MARK → CJK UNIFIED IDEOGRAPH-4E8C 3194; 4E09 # ㆔ → 三 IDEOGRAPHIC ANNOTATION THREE MARK → CJK UNIFIED IDEOGRAPH-4E09 3195; 56DB # ㆕ → 四 IDEOGRAPHIC ANNOTATION FOUR MARK → CJK UNIFIED 
IDEOGRAPH-56DB 3196; 4E0A # ㆖ → 上 IDEOGRAPHIC ANNOTATION TOP MARK → CJK UNIFIED IDEOGRAPH-4E0A 3197; 4E2D # ㆗ → 中 IDEOGRAPHIC ANNOTATION MIDDLE MARK → CJK UNIFIED IDEOGRAPH-4E2D 3198; 4E0B # ㆘ → 下 IDEOGRAPHIC ANNOTATION BOTTOM MARK → CJK UNIFIED IDEOGRAPH-4E0B 3199; 7532 # ㆙ → 甲 IDEOGRAPHIC ANNOTATION FIRST MARK → CJK UNIFIED IDEOGRAPH-7532 319A; 4E59 # ㆚ → 乙 IDEOGRAPHIC ANNOTATION SECOND MARK → CJK UNIFIED IDEOGRAPH-4E59 319B; 4E19 # ㆛ → 丙 IDEOGRAPHIC ANNOTATION THIRD MARK → CJK UNIFIED IDEOGRAPH-4E19 319C; 4E01 # ㆜ → 丁 IDEOGRAPHIC ANNOTATION FOURTH MARK → CJK UNIFIED IDEOGRAPH-4E01 319D; 5929 # ㆝ → 天 IDEOGRAPHIC ANNOTATION HEAVEN MARK → CJK UNIFIED IDEOGRAPH-5929 319E; 5730 # ㆞ → 地 IDEOGRAPHIC ANNOTATION EARTH MARK → CJK UNIFIED IDEOGRAPH-5730 319F; 4EBA # ㆟ → 人 IDEOGRAPHIC ANNOTATION MAN MARK → CJK UNIFIED IDEOGRAPH-4EBA # other characters that are superscripted forms 02C0; 0294 # ˀ → ʔ MODIFIER LETTER GLOTTAL STOP → LATIN LETTER GLOTTAL STOP 02C1; 0295 # ˁ → ʕ MODIFIER LETTER REVERSED GLOTTAL STOP → LATIN LETTER PHARYNGEAL VOICED FRICATIVE 06E5; 0648 # ۥ → و ARABIC SMALL WAW → ARABIC LETTER WAW 06E6; 064A # ۦ → ي ARABIC SMALL YEH → ARABIC LETTER YEH