Back to index

tetex-bin  3.0
encodings.c
Go to the documentation of this file.
00001 /* The unicode2adobe structure and the adobe2unicode_table mapping is taken
00002    from the catdvi (v0.12) `adobetbl.h' source file; it has the following copyright:
00003 
00004    catdvi - get text from DVI files
00005    Copyright (C) 1999 Antti-Juhani Kaijanaho <gaia@iki.fi>
00006    Copyright (C) 2001 Bjoern Brill <brill@fs.math.uni-frankfurt.de>
00007 
00008    This program is free software; you can redistribute it and/or modify
00009    it under the terms of the GNU General Public License as published by
00010    the Free Software Foundation; either version 2 of the License, or
00011    (at your option) any later version.
00012 
00013    This program is distributed in the hope that it will be useful,
00014    but WITHOUT ANY WARRANTY; without even the implied warranty of
00015    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
00016    GNU General Public License for more details.
00017 
00018    You should have received a copy of the GNU General Public License
00019    along with this program; if not, write to the Free Software
00020    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
00021 */
00022 
00023 /* Other parts are adapted from the GNU `iconv' library,
00024    (search for `iconv'), which has the following copyright:
00025  
00026    Copyright (C) 1999-2001 Free Software Foundation, Inc.
00027  
00028    The GNU LIBICONV Library is free software; you can redistribute it
00029    and/or modify it under the terms of the GNU Library General Public
00030    License as published by the Free Software Foundation; either version 2
00031    of the License, or (at your option) any later version.
00032    
00033    The GNU LIBICONV Library is distributed in the hope that it will be
00034    useful, but WITHOUT ANY WARRANTY; without even the implied warranty of
00035    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
00036    Library General Public License for more details.
00037    
00038    You should have received a copy of the GNU Library General Public
00039    License along with the GNU LIBICONV Library; see the file COPYING.LIB.
00040    If not, write to the Free Software Foundation, Inc., 59 Temple Place -
00041    Suite 330, Boston, MA 02111-1307, USA.
00042 */
00043 
00044 
00045 /* The rest of the file is Copyright (c) 2003-2004 the xdvik development team
00046 
00047    Permission is hereby granted, free of charge, to any person obtaining a copy
00048    of this software and associated documentation files (the "Software"), to
00049    deal in the Software without restriction, including without limitation the
00050    rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
00051    sell copies of the Software, and to permit persons to whom the Software is
00052    furnished to do so, subject to the following conditions:
00053 
00054    The above copyright notice and this permission notice shall be included in
00055    all copies or substantial portions of the Software.
00056 
00057    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
00058    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
00059    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
00060    PAUL VOJTA OR ANY OTHER AUTHOR OF THIS SOFTWARE BE LIABLE FOR ANY CLAIM,
00061    DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
00062    ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
00063    OTHER DEALINGS IN THE SOFTWARE.
00064 */
00065 
00066 #include "xdvi-config.h"
00067 #include "xdvi.h"
00068 
00069 #if HAVE_ICONV_H
00070 # include <iconv.h>
00071 static iconv_t m_iconv_gb_ucs4 = (iconv_t)(-1);
00072 #else
00073 static Boolean warned_about_cjk = False;
00074 #endif /* HAVE_ICONV_H */
00075 
00076 #include <ctype.h>
00077 
00078 #include "util.h"
00079 #include "encodings.h"
00080 #include "my-snprintf.h"
00081 #include "message-window.h"
00082 
00083 #define MY_DEBUG 0
00084 
00085 #if MY_DEBUG
00086 # define TRACE_FIND_VERBOSE(x) TRACE_FIND(x)
00087 #else
00088 # define TRACE_FIND_VERBOSE(x) /* as nothing */
00089 #endif
00090 
00091 /*
00092   The following encoding vectors are copied from catdvi's enc/xyz.h files;
00093   only the `.notdef' values have been replaced by 0 instead of 0x003f
00094   (question mark) to make the mapping more flexible.
00095 */
00096 
00097 /* from enc/texmsym.h */
00098 static uint32_t m_cm_symbol_encoding[256] = {
00099     0x2212, 0x00b7, 0x00d7, 0x2217, 0x00f7, 0x22c4, 0x00b1, 0x2213,
00100     0x2295, 0x2296, 0x2297, 0x2298, 0x2299, 0x25ef, 0x25e6, 0x2022,
00101     /* 0x10 */
00102     0x224d, 0x2261, 0x2286, 0x2287, 0x2264, 0x2265, 0x227c, 0x227d,
00103     0x223c, 0x2248, 0x2282, 0x2283, 0x226a, 0x226b, 0x227a, 0x227b,
00104     /* 0x20 */
00105     0x2190, 0x2192, 0x2191, 0x2193, 0x2194, 0x2197, 0x2198, 0x2243,
00106     0x21d0, 0x21d2, 0x21d1, 0x21d3, 0x21d4, 0x2196, 0x2199, 0x221d,
00107     /* 0x30 */
00108     0x2032, 0x221e, 0x2208, 0x220b, 0x25b3, 0x25bd, 0x10fffc, 0,
00109     0x2200, 0x2203, 0x00ac, 0x2205, 0x211c, 0x2111, 0x22a4, 0x22a5,
00110     /* 0x40 */
00111     0x2135, 0x0041, 0x0042, 0x0043, 0x0044, 0x0045, 0x0046, 0x0047,
00112     0x0048, 0x0049, 0x004a, 0x004b, 0x004c, 0x004d, 0x004e, 0x004f,
00113     /* 0x50 */
00114     0x0050, 0x0051, 0x0052, 0x0053, 0x0054, 0x0055, 0x0056, 0x0057,
00115     0x0058, 0x0059, 0x005a, 0x222a, 0x2229, 0x228e, 0x2227, 0x2228,
00116     /* 0x60 */
00117     0x22a2, 0x22a3, 0x230a, 0x230b, 0x2308, 0x2309, 0x007b, 0x007d,
00118     0x2329, 0x232a, 0x007c, 0x2225, 0x2195, 0x21d5, 0x005c, 0x2240,
00119     /* 0x70 */
00120     0x221a, 0x2210, 0x2207, 0x222b, 0x2294, 0x2293, 0x2291, 0x2292,
00121     0x00a7, 0x2020, 0x2021, 0x00b6, 0x2663, 0x2666, 0x2665, 0x2660,
00122     /* 0x80 */
00123     0, 0, 0, 0, 0, 0, 0, 0,
00124     0, 0, 0, 0, 0, 0, 0, 0,
00125     /* 0x90 */
00126     0, 0, 0, 0, 0, 0, 0, 0,
00127     0, 0, 0, 0, 0, 0, 0, 0,
00128     /* 0xa0 */
00129     0, 0, 0, 0, 0, 0, 0, 0,
00130     0, 0, 0, 0, 0, 0, 0, 0,
00131     /* 0b0 */
00132     0, 0, 0, 0, 0, 0, 0, 0,
00133     0, 0, 0, 0, 0, 0, 0, 0,
00134     /* 0xc0 */
00135     0, 0, 0, 0, 0, 0, 0, 0,
00136     0, 0, 0, 0, 0, 0, 0, 0,
00137     /* 0xd0 */
00138     0, 0, 0, 0, 0, 0, 0, 0,
00139     0, 0, 0, 0, 0, 0, 0, 0,
00140     /* 0xe0 */
00141     0, 0, 0, 0, 0, 0, 0, 0,
00142     0, 0, 0, 0, 0, 0, 0, 0,
00143     /* 0xf0 */
00144     0, 0, 0, 0, 0, 0, 0, 0,
00145     0, 0, 0, 0, 0, 0, 0, 0
00146 };
00147 
00148 /* from enc/texmital.h */
00149 static uint32_t m_cm_math_italics_encoding[256] = {
00150     /* 0x00 */
00151     0x0393, 0x0394, 0x0398, 0x039b, 0x039e, 0x03a0, 0x03a3, 0x03a5,
00152     0x03a6, 0x03a8, 0x03a9, 0x03b1, 0x03b2, 0x03b3, 0x03b4, 0x03f5,
00153     /* 0x10 */
00154     0x03b6, 0x03b7, 0x03b8, 0x03b9, 0x03ba, 0x03bb, 0x03bc, 0x03bd,
00155     0x03be, 0x03c0, 0x03c1, 0x03c3, 0x03c4, 0x03c5, 0x03d5, 0x03c7,
00156     /* 0x20 */
00157     0x03c8, 0x03c9, 0x03b5, 0x03d1, 0x03d6, 0x03f1, 0x03c2, 0x03c6,
00158     0x21bc, 0x21bd, 0x21c0, 0x21c1, 0, 0, 0x22b3, 0x22b2,
00159     /* 0x30 */
00160     0xf730, 0xf731, 0xf732, 0xf733, 0xf734, 0xf735, 0xf736, 0xf737,
00161     0xf738, 0xf739, 0x002e, 0x002c, 0x003c, 0x002f, 0x003e, 0x22c6,
00162     /* 0x40 */
00163     0x2202, 0x0041, 0x0042, 0x0043, 0x0044, 0x0045, 0x0046, 0x0047,
00164     0x0048, 0x0049, 0x004a, 0x004b, 0x004c, 0x004d, 0x004e, 0x004f,
00165     /* 0x50 */
00166     0x0050, 0x0051, 0x0052, 0x0053, 0x0054, 0x0055, 0x0056, 0x0057,
00167     0x0058, 0x0059, 0x005a, 0x266d, 0x266e, 0x266f, 0x2323, 0x2322,
00168     /* 0x60 */
00169     0x2113, 0x0061, 0x0062, 0x0063, 0x0064, 0x0065, 0x0066, 0x0067,
00170     0x0068, 0x0069, 0x006a, 0x006b, 0x006c, 0x006d, 0x006e, 0x006f,
00171     /* 0x70 */
00172     0x0070, 0x0071, 0x0072, 0x0073, 0x0074, 0x0075, 0x0076, 0x0077,
00173     0x0078, 0x0079, 0x007a, 0x0131, 0xf6be, 0x2118, 0x10fffb, 0x2040,
00174     /* 0x80 */
00175     0, 0, 0, 0, 0, 0, 0, 0,
00176     0, 0, 0, 0, 0, 0, 0, 0,
00177     /* 0x90 */
00178     0, 0, 0, 0, 0, 0, 0, 0,
00179     0, 0, 0, 0, 0, 0, 0, 0,
00180     /* 0xa0 */
00181     0, 0, 0, 0, 0, 0, 0, 0,
00182     0, 0, 0, 0, 0, 0, 0, 0,
00183     /* 0xb0 */
00184     0, 0, 0, 0, 0, 0, 0, 0,
00185     0, 0, 0, 0, 0, 0, 0, 0,
00186     /* 0xc0 */
00187     0, 0, 0, 0, 0, 0, 0, 0,
00188     0, 0, 0, 0, 0, 0, 0, 0,
00189     /* 0xd0 */
00190     0, 0, 0, 0, 0, 0, 0, 0,
00191     0, 0, 0, 0, 0, 0, 0, 0,
00192     /* 0xe0 */
00193     0, 0, 0, 0, 0, 0, 0, 0,
00194     0, 0, 0, 0, 0, 0, 0, 0,
00195     /* 0xf0 */
00196     0, 0, 0, 0, 0, 0, 0, 0,
00197     0, 0, 0, 0, 0, 0, 0, 0
00198 };
00199 
00200 /* from enc/texmext.h */
00201 static uint32_t m_cm_math_extended_encoding[256] = {
00202     /* 0x00 */
00203     0x10ff00, 0x10ff01, 0x10ff02, 0x10ff03, 0x10ff04, 0x10ff05, 0x10ff06, 0x10ff07,
00204     0x10ff08, 0x10ff09, 0x10ff0a, 0x10ff0b, 0x10ff0c, 0x10ff0d, 0x10ff0e, 0x10ff0f,
00205     /* 0x10 */
00206     0x10ff10, 0x10ff11, 0x10ff12, 0x10ff13, 0x10ff14, 0x10ff15, 0x10ff16, 0x10ff17,
00207     0x10ff18, 0x10ff19, 0x10ff1a, 0x10ff1b, 0x10ff1c, 0x10ff1d, 0x10ff1e, 0x10ff1f,
00208     /* 0x20 */
00209     0x10ff20, 0x10ff21, 0x10ff22, 0x10ff23, 0x10ff24, 0x10ff25, 0x10ff26, 0x10ff27,
00210     0x10ff28, 0x10ff29, 0x10ff2a, 0x10ff2b, 0x10ff2c, 0x10ff2d, 0x10ff2e, 0x10ff2f,
00211     /* 0x30 */
00212     0xf8eb, 0xf8f6, 0xf8ee, 0xf8f9, 0xf8f0, 0xf8fb, 0xf8ef, 0xf8fa,
00213     0xf8f1, 0xf8fc, 0xf8f3, 0xf8fe, 0xf8f2, 0xf8fd, 0xf8f4, 0xf8e6,
00214     /* 0x40 */
00215     0xf8ed, 0xf8f8, 0xf8ec, 0xf8f7, 0x10ff44, 0x10ff45, 0x10ff46, 0x10ff47,
00216     0x10ff48, 0x10ff49, 0x10ff4a, 0x10ff4b, 0x10ff4c, 0x10ff4d, 0x10ff4e, 0x10ff4f,
00217     /* 0x50 */
00218     0x10ff50, 0x10ff51, 0x10ff52, 0x10ff53, 0x10ff54, 0x10ff55, 0x10ff56, 0x10ff57,
00219     0x10ff58, 0x10ff59, 0x10ff5a, 0x10ff5b, 0x10ff5c, 0x10ff5d, 0x10ff5e, 0x10ff5f,
00220     /* 0x60 */
00221     0x10ff60, 0x10ff61, 0x10ff62, 0x10ff63, 0x10ff64, 0x10ff65, 0x10ff66, 0x10ff67,
00222     0x10ff68, 0x10ff69, 0x10ff6a, 0x10ff6b, 0x10ff6c, 0x10ff6d, 0x10ff6e, 0x10ff6f,
00223     /* 0x70 */
00224     0x10ff70, 0x10ff71, 0x10ff72, 0x10ff73, 0x10ff74, 0x10ff75, 0x10ff76, 0x10ff77,
00225     0x10ff78, 0x10ff79, 0x10ff7a, 0x10ff7b, 0x10ff7c, 0x10ff7d, 0x10ff7e, 0x10ff7f,
00226     /* 0x80 */
00227     0, 0, 0, 0, 0, 0, 0, 0,
00228     0, 0, 0, 0, 0, 0, 0, 0,
00229     /* 0x90 */
00230     0, 0, 0, 0, 0, 0, 0, 0,
00231     0, 0, 0, 0, 0, 0, 0, 0,
00232     /* 0xa0 */
00233     0, 0, 0, 0, 0, 0, 0, 0,
00234     0, 0, 0, 0, 0, 0, 0, 0,
00235     /* 0xb0 */
00236     0, 0, 0, 0, 0, 0, 0, 0,
00237     0, 0, 0, 0, 0, 0, 0, 0,
00238     /* 0xc0 */
00239     0, 0, 0, 0, 0, 0, 0, 0,
00240     0, 0, 0, 0, 0, 0, 0, 0,
00241     /* 0xd0 */
00242     0, 0, 0, 0, 0, 0, 0, 0,
00243     0, 0, 0, 0, 0, 0, 0, 0,
00244     /* 0xe0 */
00245     0, 0, 0, 0, 0, 0, 0, 0,
00246     0, 0, 0, 0, 0, 0, 0, 0,
00247     /* 0xf0 */
00248     0, 0, 0, 0, 0, 0, 0, 0,
00249     0, 0, 0, 0, 0, 0, 0, 0
00250 };
00251 
00252 /* from enc/textt.h */
00253 static uint32_t m_cm_typewriter_encoding[256] = {
00254     /* 0x00 */
00255     0x0393, 0x0394, 0x0398, 0x039b, 0x039e, 0x03a0, 0x03a3, 0x03a5,
00256     0x03a6, 0x03a8, 0x03a9, 0x2191, 0x2193, 0x0027, 0x00a1, 0x00bf,
00257     /* 0x10 */
00258     0x0131, 0xf6be, 0x0060, 0x00b4, 0x02c7, 0x02d8, 0x00af, 0x02da,
00259     0x00b8, 0x00df, 0x00e6, 0x0153, 0x00f8, 0x00c6, 0x0152, 0x00d8,
00260     /* 0x20 */
00261     0x0020, 0x0021, 0x0022, 0x0023, 0x0024, 0x0025, 0x0026, 0x2019,
00262     0x0028, 0x0029, 0x002a, 0x002b, 0x002c, 0x002d, 0x002e, 0x002f,
00263     /* 0x30 */
00264     0x0030, 0x0031, 0x0032, 0x0033, 0x0034, 0x0035, 0x0036, 0x0037,
00265     0x0038, 0x0039, 0x003a, 0x003b, 0x003c, 0x003d, 0x003e, 0x003f,
00266     /* 0x40 */
00267     0x0040, 0x0041, 0x0042, 0x0043, 0x0044, 0x0045, 0x0046, 0x0047,
00268     0x0048, 0x0049, 0x004a, 0x004b, 0x004c, 0x004d, 0x004e, 0x004f,
00269     /* 0x50 */
00270     0x0050, 0x0051, 0x0052, 0x0053, 0x0054, 0x0055, 0x0056, 0x0057,
00271     0x0058, 0x0059, 0x005a, 0x005b, 0x005c, 0x005d, 0x02c6, 0x005f,
00272     /* 0x60 */
00273     0x2018, 0x0061, 0x0062, 0x0063, 0x0064, 0x0065, 0x0066, 0x0067,
00274     0x0068, 0x0069, 0x006a, 0x006b, 0x006c, 0x006d, 0x006e, 0x006f,
00275     /* 0x70 */
00276     0x0070, 0x0071, 0x0072, 0x0073, 0x0074, 0x0075, 0x0076, 0x0077,
00277     0x0078, 0x0079, 0x007a, 0x007b, 0x007c, 0x007d, 0x02dc, 0x00a8,
00278     /* 0x80 */
00279     0, 0, 0, 0, 0, 0, 0, 0,
00280     0, 0, 0, 0, 0, 0, 0, 0,
00281     /* 0x90 */
00282     0, 0, 0, 0, 0, 0, 0, 0,
00283     0, 0, 0, 0, 0, 0, 0, 0,
00284     /* 0xa0 */
00285     0, 0, 0, 0, 0, 0, 0, 0,
00286     0, 0, 0, 0, 0, 0, 0, 0,
00287     /* 0xb0 */
00288     0, 0, 0, 0, 0, 0, 0, 0,
00289     0, 0, 0, 0, 0, 0, 0, 0,
00290     /* 0xc0 */
00291     0, 0, 0, 0, 0, 0, 0, 0,
00292     0, 0, 0, 0, 0, 0, 0, 0,
00293     /* 0xd0 */
00294     0, 0, 0, 0, 0, 0, 0, 0,
00295     0, 0, 0, 0, 0, 0, 0, 0,
00296     /* 0xe0 */
00297     0, 0, 0, 0, 0, 0, 0, 0,
00298     0, 0, 0, 0, 0, 0, 0, 0,
00299     /* 0xf0 */
00300     0, 0, 0, 0, 0, 0, 0, 0,
00301     0, 0, 0, 0, 0, 0, 0, 0
00302 };
00303 
00304 /* from enc/ot1.h */
00305 static uint32_t m_ot1_encoding[256] = {
00306     /* 0x00 */
00307     0x0393, 0x0394, 0x0398, 0x039b, 0x039e, 0x03a0, 0x03a3, 0x03a5,
00308     0x03a6, 0x03a8, 0x03a9, 0xfb00, 0xfb01, 0xfb02, 0xfb03, 0xfb04,
00309     /* 0x10 */
00310     0x0131, 0xf6be, 0x0060, 0x00b4, 0x02c7, 0x02d8, 0x00af, 0x02da,
00311     0x00b8, 0x00df, 0x00e6, 0x0153, 0x00f8, 0x00c6, 0x0152, 0x00d8,
00312     /* 0x20 */
00313     0x0020, 0x0021, 0x201c, 0x0023, 0x0024, 0x0025, 0x0026, 0x2019,
00314     0x0028, 0x0029, 0x002a, 0x002b, 0x002c, 0x002d, 0x002e, 0x002f,
00315     /* 0x30 */
00316     0x0030, 0x0031, 0x0032, 0x0033, 0x0034, 0x0035, 0x0036, 0x0037,
00317     0x0038, 0x0039, 0x003a, 0x003b, 0x00a1, 0x003d, 0x00bf, 0x003f,
00318     /* 0x40 */
00319     0x0040, 0x0041, 0x0042, 0x0043, 0x0044, 0x0045, 0x0046, 0x0047,
00320     0x0048, 0x0049, 0x004a, 0x004b, 0x004c, 0x004d, 0x004e, 0x004f,
00321     /* 0x50 */
00322     0x0050, 0x0051, 0x0052, 0x0053, 0x0054, 0x0055, 0x0056, 0x0057,
00323     0x0058, 0x0059, 0x005a, 0x005b, 0x201d, 0x005d, 0x02c6, 0x02d9,
00324     /* 0x60 */
00325     0x2018, 0x0061, 0x0062, 0x0063, 0x0064, 0x0065, 0x0066, 0x0067,
00326     0x0068, 0x0069, 0x006a, 0x006b, 0x006c, 0x006d, 0x006e, 0x006f,
00327     /* 0x70 */
00328     0x0070, 0x0071, 0x0072, 0x0073, 0x0074, 0x0075, 0x0076, 0x0077,
00329     0x0078, 0x0079, 0x007a, 0x2013, 0x2014, 0x0022, 0x02dc, 0x00a8,
00330     /* 0x80 */
00331     0, 0, 0, 0, 0, 0, 0, 0,
00332     0, 0, 0, 0, 0, 0, 0, 0,
00333     /* 0x90 */
00334     0, 0, 0, 0, 0, 0, 0, 0,
00335     0, 0, 0, 0, 0, 0, 0, 0,
00336     /* 0xa0 */
00337     0, 0, 0, 0, 0, 0, 0, 0,
00338     0, 0, 0, 0, 0, 0, 0, 0,
00339     /* 0xb0 */
00340     0, 0, 0, 0, 0, 0, 0, 0,
00341     0, 0, 0, 0, 0, 0, 0, 0,
00342     /* 0xc0 */
00343     0, 0, 0, 0, 0, 0, 0, 0,
00344     0, 0, 0, 0, 0, 0, 0, 0,
00345     /* 0xd0 */
00346     0, 0, 0, 0, 0, 0, 0, 0,
00347     0, 0, 0, 0, 0, 0, 0, 0,
00348     /* 0xe0 */
00349     0, 0, 0, 0, 0, 0, 0, 0,
00350     0, 0, 0, 0, 0, 0, 0, 0,
00351     /* 0xf0 */
00352     0, 0, 0, 0, 0, 0, 0, 0,
00353     0, 0, 0, 0, 0, 0, 0, 0
00354 };
00355 
00356 /* Cyrilic e.g. fro larm1000.mf; from
00357    http://www.tug.org/tex-archive/macros/latex/contrib/t2/enc-maps/OT2uni.map */
00358 static uint32_t m_t2_encoding[256] = {
00359     0x0060, 0x00b4, 0x02c6, 0x02dc, 0x00a8, 0x02dd, 0x02da, 0x02c7,
00360     0x02d8, 0x00af, 0x02d9, 0x00b8, 0x02db, 0x04c0, 0x2329, 0x232a, 
00361     /* 0x10 */
00362     0x201c, 0x201d, 0xf6d5, 0xf6d6, 0xf6d4, 0x2013, 0x2014, 0xfeff,
00363     0x2080, 0x0131, 0xf6be, 0xfb00, 0xfb01, 0xfb02, 0xfb03, 0xfb04,
00364     /* 0x20 */
00365     0x2420, 0x0021, 0x0022, 0x0023, 0x0024, 0x0025, 0x0026, 0x2019,
00366     0x0028, 0x0029, 0x002a, 0x002b, 0x002c, 0x002d, 0x002e, 0x002f,
00367     /* 0x30 */
00368     0x0030, 0x0031, 0x0032, 0x0033, 0x0034, 0x0035, 0x0036, 0x0037,
00369     0x0038, 0x0039, 0x003a, 0x003b, 0x003c, 0x003d, 0x003e, 0x003f,
00370     /* 0x40 */
00371     0x0040, 0x0041, 0x0042, 0x0043, 0x0044, 0x0045, 0x0046, 0x0047,
00372     0x0048, 0x0049, 0x004a, 0x004b, 0x004c, 0x004d, 0x004e, 0x004f,
00373     /* 0x50 */
00374     0x0050, 0x0051, 0x0052, 0x0053, 0x0054, 0x0055, 0x0056, 0x0057,
00375     0x0058, 0x0059, 0x005a, 0x005b, 0x005c, 0x005d, 0x005e, 0x005f,
00376     /* 0x60 */
00377     0x2018, 0x0061, 0x0062, 0x0063, 0x0064, 0x0065, 0x0066, 0x0067,
00378     0x0068, 0x0069, 0x006a, 0x006b, 0x006c, 0x006d, 0x006e, 0x006f,
00379     /* 0x70 */
00380     0x0070, 0x0071, 0x0072, 0x0073, 0x0074, 0x0075, 0x0076, 0x0077,
00381     0x0078, 0x0079, 0x007a, 0x007b, 0x007c, 0x007d, 0x007e, 0x002d,
00382     /* 0x80 */
00383     0x0490, 0x0492, 0x0402, 0x040b, 0x04ba, 0x0496, 0x0498, 0x0409,
00384     0x0407, 0x049a, 0x04a0, 0x049c, 0x04d4, 0x04a2, 0x04a4, 0x0405,
00385     /* 0x90 */
00386     0x04e8, 0x04aa, 0x040e, 0x04ae, 0x04b0, 0x04b2, 0x040f, 0x04b8,
00387     0x04b6, 0x0404, 0x04d8, 0x040a, 0x0401, 0x2116, 0x00a4, 0x00a7,
00388     /* 0xa0 */
00389     0x0491, 0x0493, 0x0452, 0x045b, 0x04bb, 0x0497, 0x0499, 0x0459,
00390     0x0457, 0x049b, 0x04a1, 0x049d, 0x04d5, 0x04a3, 0x04a5, 0x0455,
00391     /* 0xb0 */
00392     0x04e9, 0x04ab, 0x045e, 0x04af, 0x04b1, 0x04b3, 0x045f, 0x04b9,
00393     0x04b7, 0x0454, 0x04d9, 0x045a, 0x0451, 0x201e, 0x00ab, 0x00bb,
00394     /* 0xc0 */
00395     0x0410, 0x0411, 0x0412, 0x0413, 0x0414, 0x0415, 0x0416, 0x0417,
00396     0x0418, 0x0419, 0x041a, 0x041b, 0x041c, 0x041d, 0x041e, 0x041f,
00397     /* 0xd0 */
00398     0x0420, 0x0421, 0x0422, 0x0423, 0x0424, 0x0425, 0x0426, 0x0427,
00399     0x0428, 0x0429, 0x042a, 0x042b, 0x042c, 0x042d, 0x042e, 0x042f,
00400     /* 0xe0 */
00401     0x0430, 0x0431, 0x0432, 0x0433, 0x0434, 0x0435, 0x0436, 0x0437,
00402     0x0438, 0x0439, 0x043a, 0x043b, 0x043c, 0x043d, 0x043e, 0x043f,
00403     /* 0xf0 */
00404     0x0440, 0x0441, 0x0442, 0x0443, 0x0444, 0x0445, 0x0446, 0x0447,
00405     0x0448, 0x0449, 0x044a, 0x044b, 0x044c, 0x044d, 0x044e, 0x044f,
00406 };
00407 
00408 /* from enc/cork.h */
00409 static uint32_t m_cork_encoding[256] = {
00410     /* 0x00 */
00411     0x0060, 0x00b4, 0x02c6, 0x02dc, 0x00a8, 0x02dd, 0x02da, 0x02c7,
00412     0x02d8, 0x00af, 0x02d9, 0x00b8, 0x02db, 0x201a, 0x2039, 0x203a,
00413     /* 0x10 */
00414     0x201c, 0x201d, 0x201e, 0x00ab, 0x00bb, 0x2013, 0x2014, 0x0020,
00415     0x0030, 0x0131, 0xf6be, 0xfb00, 0xfb01, 0xfb02, 0xfb03, 0xfb04,
00416     /* 0x20 */
00417     0x2420, 0x0021, 0x0022, 0x0023, 0x0024, 0x0025, 0x0026, 0x2019,
00418     0x0028, 0x0029, 0x002a, 0x002b, 0x002c, 0x002d, 0x002e, 0x002f,
00419     /* 0x30 */
00420     0x0030, 0x0031, 0x0032, 0x0033, 0x0034, 0x0035, 0x0036, 0x0037,
00421     0x0038, 0x0039, 0x003a, 0x003b, 0x003c, 0x003d, 0x003e, 0x003f,
00422     /* 0x40 */
00423     0x0040, 0x0041, 0x0042, 0x0043, 0x0044, 0x0045, 0x0046, 0x0047,
00424     0x0048, 0x0049, 0x004a, 0x004b, 0x004c, 0x004d, 0x004e, 0x004f,
00425     /* 0x50 */
00426     0x0050, 0x0051, 0x0052, 0x0053, 0x0054, 0x0055, 0x0056, 0x0057,
00427     0x0058, 0x0059, 0x005a, 0x005b, 0x005c, 0x005d, 0x005e, 0x005f,
00428     /* 0x60 */
00429     0x2018, 0x0061, 0x0062, 0x0063, 0x0064, 0x0065, 0x0066, 0x0067,
00430     0x0068, 0x0069, 0x006a, 0x006b, 0x006c, 0x006d, 0x006e, 0x006f,
00431     /* 0x70 */
00432     0x0070, 0x0071, 0x0072, 0x0073, 0x0074, 0x0075, 0x0076, 0x0077,
00433     0x0078, 0x0079, 0x007a, 0x007b, 0x007c, 0x007d, 0x007e, 0x002d,
00434     /* 0x80 */
00435     0x0102, 0x0104, 0x0106, 0x010c, 0x010e, 0x011a, 0x0118, 0x011e,
00436     0x0139, 0x013d, 0x0141, 0x0143, 0x0147, 0x10ffff, 0x0150, 0x0154,
00437     /* 0x90 */
00438     0x0158, 0x015a, 0x0160, 0x015e, 0x0164, 0x0162, 0x0170, 0x016e,
00439     0x0178, 0x0179, 0x017d, 0x017b, 0x0132, 0x0130, 0x0111, 0x00a7,
00440     /* 0xa0 */
00441     0x0103, 0x0105, 0x0107, 0x010d, 0x010f, 0x011b, 0x0119, 0x011f,
00442     0x013a, 0x013e, 0x0142, 0x0144, 0x0148, 0x10fffe, 0x0151, 0x0155,
00443     /* 0xb0 */
00444     0x0159, 0x015b, 0x0161, 0x015f, 0x0165, 0x0163, 0x0171, 0x016f,
00445     0x00FF, 0x017a, 0x017e, 0x017c, 0x0133, 0x00a1, 0x00bf, 0x00a3,
00446     /* 0xc0 */
00447     0x00c0, 0x00c1, 0x00c2, 0x00c3, 0x00c4, 0x00c5, 0x00c6, 0x00c7,
00448     0x00c8, 0x00c9, 0x00ca, 0x00cb, 0x00cc, 0x00cd, 0x00ce, 0x00cf,
00449     /* 0xd0 */
00450     0x00d0, 0x00d1, 0x00d2, 0x00d3, 0x00d4, 0x00d5, 0x00d6, 0x0152,
00451     0x00d8, 0x00d9, 0x00da, 0x00db, 0x00dc, 0x00dd, 0x00de, 0x10fffd,
00452     /* 0xe0 */
00453     0x00e0, 0x00e1, 0x00e2, 0x00e3, 0x00e4, 0x00e5, 0x00e6, 0x00e7,
00454     0x00e8, 0x00e9, 0x00ea, 0x00eb, 0x00ec, 0x00ed, 0x00ee, 0x00ef,
00455     /* 0xf0 */
00456     0x00f0, 0x00f1, 0x00f2, 0x00f3, 0x00f4, 0x00f5, 0x00f6, 0x0153,
00457     0x00f8, 0x00f9, 0x00fa, 0x00fb, 0x00fc, 0x00fd, 0x00fe, 0x00df
00458 };
00459 
00460 /* Newly created ts1-lm.h, which we use for TC (textcomp) fonts.
00461    This only gets the accents and stuff from iso-latin1 right; lots of
00462    the special characters aren't defined in the Adobe lookup list
00463    used by catdvi's `pse2unic'.
00464  */
00465 static uint32_t m_ts1_encoding[256] = {
00466     /* 0x00 */
00467     0x0060, 0x00b4, 0x02c6, 0x02dc, 0x00a8, 0x02dd, 0x02da, 0x02c7,
00468     0x02d8, 0, 0x02d9, 0x00b8, 0x02db, 0, 0, 0,
00469     /* 0x10 */
00470     0, 0, 0, 0, 0, 0x2013, 0xf6de, 0,
00471     0x2190, 0x2192, 0, 0, 0, 0, 0, 0,
00472     /* 0x20 */
00473     0, 0, 0, 0, 0x0024, 0, 0, 0,
00474     0, 0, 0x2217, 0, 0x002c, 0, 0x002e, 0,
00475     /* 0x30 */
00476     0xf730, 0xf731, 0xf732, 0xf733, 0xf734, 0xf735, 0xf736, 0xf737,
00477     0xf738, 0xf739, 0, 0, 0x2329, 0x2212, 0x232a, 0,
00478     /* 0x40 */
00479     0, 0, 0, 0, 0, 0, 0, 0,
00480     0, 0, 0, 0, 0, 0, 0, 0,
00481     /* 0x50 */
00482     0, 0, 0, 0, 0, 0, 0, 0,
00483     0, 0, 0, 0, 0, 0, 0x2191, 0x2193,
00484     /* 0x60 */
00485     0, 0, 0, 0, 0, 0, 0, 0,
00486     0, 0, 0, 0, 0, 0, 0x266a, 0,
00487     /* 0x70 */
00488     0, 0, 0, 0, 0, 0, 0, 0,
00489     0, 0, 0, 0, 0, 0, 0x007e, 0x003d,
00490     /* 0x80 */
00491     0, 0, 0, 0, 0x2020, 0x2021, 0, 0x2030,
00492     0x2022, 0, 0xf724, 0xf7a2, 0x0192, 0x20a1, 0, 0,
00493     /* 0x90 */
00494     0, 0, 0x20a4, 0, 0, 0, 0x20ab, 0x2122,
00495     0, 0, 0, 0, 0, 0x212e, 0x25e6, 0,
00496     /* 0xa0 */
00497     0, 0, 0x00a2, 0x00a3, 0x00a4, 0x00a5, 0x00a6, 0x00a7,
00498     0, 0x00a9, 0x00aa, 0, 0x00ac, 0, 0x00ae, 0,
00499     /* 0xb0 */
00500     0x00b0, 0x00b1, 0x00b2, 0x00b3, 0, 0, 0x00b6, 0x00b7,
00501     0, 0x00b9, 0x00ba, 0x221a, 0x00bc, 0x00bd, 0x00be, 0x20ac,
00502     /* 0xc0 */
00503     0, 0, 0, 0, 0, 0, 0, 0,
00504     0, 0, 0, 0, 0, 0, 0, 0,
00505     /* 0xd0 */
00506     0, 0, 0, 0, 0, 0, 0x00d7, 0,
00507     0, 0, 0, 0, 0, 0, 0, 0,
00508     /* 0xe0 */
00509     0, 0, 0, 0, 0, 0, 0, 0,
00510     0, 0, 0, 0, 0, 0, 0, 0,
00511     /* 0xf0 */
00512     0, 0, 0, 0, 0, 0, 0x00f7, 0,
00513     0, 0, 0, 0, 0, 0, 0, 0
00514 };
00515 
00516 /* blackletter fonts with funny encodings
00517  */
00518 static uint32_t m_yfrak_encoding[176] = {
00519     /* 0x00 */
00520     0, 0, 0, 0, 0, 0, 0, 0,
00521     0, 0, 0, 0, 0, 0, 0, 0,
00522     /* 0x10 */
00523     0x0131, 0xF6BE, 0x0060, 0x00b4, 0x02c7, 0x02d8, 0x00af, 0x02da,
00524     0x00b8, 0, 0x00df, 0, 0, 0, 0, 0,
00525     /* 0x20 */
00526     0, 0x0021, 0x0022, 0x0023, 0, 0x0025, 0, 0x2019,
00527     0x0028, 0x0029, 0x002a, 0x002b, 0x002c, 0x002d, 0x002e, 0x002f,
00528     /* 0x30 */
00529     0x0030, 0x0031, 0x0032, 0x0033, 0x0034, 0x0035, 0x0036, 0x0037,
00530     0x0038, 0x0039, 0x003a, 0, 0x003c, 0x003d, 0, 0x003f,
00531     /* 0x40 */
00532     0, 0x0041, 0x0042, 0x0043, 0x0044, 0x0045, 0x0046, 0x0047,
00533     0x0048, 0x0049, 0x004a, 0x004b, 0x004c, 0x004d, 0x004e, 0x004f,
00534     /* 0x50 */
00535     0x0050, 0x0051, 0x0052, 0x0053, 0x0054, 0x0055, 0x0056, 0x0057,
00536     0x0058, 0x0059, 0x005a, 0x005b, 0x00ab, 0x005d, 0x005e, 0x02d9,
00537     /* 0x60 */
00538     0x2018, 0x0061, 0x0062, 0x0063, 0x0064, 0x0065, 0x0066, 0x0067,
00539     0x0068, 0x0069, 0x006a, 0x006b, 0x006c, 0x006d, 0x006e, 0x006f,
00540     /* 0x70 */
00541     0x0070, 0x0071, 0x0072, 0x0073, 0x0074, 0x0075, 0x0076, 0x0077,
00542     0x0078, 0x0079, 0x007a, 0x2013, 0x2014, 0x00a8, 0x02dd, 0,
00543     /* 0x80 */ /* ch/ck ligatures treated as special cases */
00544     0, 0xfb00, 0xfb05, 0xfb00, 0xfb00, 0, 0, 0,
00545     0, 0x00e4, 0x00e4, 0, 0, 0x0073, 0, 0,
00546     /* 0x90 */
00547     0x00eb, 0x00eb, 0, 0, 0, 0, 0, 0,
00548     0, 0x00f6, 0x00f6, 0, 0, 0, 0x00fc, 0x00fc,
00549     /* 0xa0 */
00550     0, 0, 0, 0, 0x00B6, 0, 0, 0 /* sz */,
00551     0, 0, 0, 0, 0, 0, 0, 0
00552 };
00553 
00554 /*
00555   Mapping table of adobe character names (from .enc files) to Unicode IDs.
00556   Taken from catdvi's adobetbl.h; the original glyph list is available from:
00557   http://partners.adobe.com/asn/tech/type/glyphlist.txt
00558   All `private space' entries have been removed (I think they are of not
00559   much use).
00560   
00561   The names beginning with `$' have been added by the catdvi developers.
00562 
00563   Changes:
00564   - The macros DUP1/DUP2 have been #if 0'ed because I didn't understand them.
00565   - `.notdef' has been replaced by 0 to remove ambiguity with the real question mark.
00566   
00567   The list is sorted for strcmp() so that we can use bsearch() on it.
00568 */
00569 static struct adobe2unicode adobe2unicode_table[] = {
00570     { "$Delta" , 0x0394 }, /* GREEK CAPITAL LETTER DELTA; distinguish Adobe duplicates */
00571     { "$Ohm" , 0x2126 }, /* OHM SIGN; distinguish Adobe duplicates */
00572     { "$Omega" , 0x03A9 }, /* GREEK CAPITAL LETTER OMEGA; distinguish Adobe duplicates */
00573     { "$Scedilla" , 0x015E }, /* LATIN CAPITAL LETTER S WITH CEDILLA; distinguish Adobe duplicates */
00574     { "$Tcedilla", 0x0162 }, /* LATIN CAPITAL LETTER T WITH CEDILLA; distinguish Adobe duplicates */
00575     { "$Tcommaaccent", 0x021A }, /* LATIN CAPITAL LETTER T WITH COMMA BELOW; distinguish Adobe duplicates */
00576     { "$acutemodifier", 0x02CA }, /* MODIFIER LETTER ACUTE ACCENT */
00577     { "$arrowdblupdn", 0x21D5 }, /* UP DOWN DOUBLE ARROW */
00578     { "$arrownortheast", 0x2197 }, /* NORTH EAST ARROW */
00579     { "$arrownorthwest", 0x2196 }, /* NORTH WEST ARROW */
00580     { "$arrowsoutheast", 0x2198 }, /* SOUTH EAST ARROW */
00581     { "$arrowsouthwest", 0x2199 }, /* SOUTH WEST ARROW */
00582     { "$brevecomb", 0x0306 }, /* COMBINING BREVE */
00583     { "$bulletmath" , 0x2219 }, /* BULLET OPERATOR; distinguish Adobe duplicates */
00584     { "$caroncomb", 0x030C }, /* COMBINING CARON */
00585     { "$cedillacomb", 0x0327 }, /* COMBINING CEDILLA */
00586     { "$ceilingleft", 0x2308 }, /* LEFT CEILING */
00587     { "$ceilingright", 0x2309 }, /* RIGHT CEILING */
00588     { "$circlecomb", 0x20DD }, /* COMBINING ENCLOSING CIRCLE */
00589     { "$circledivide", 0x2298 }, /* CIRCLED DIVISION SLASH */
00590     { "$circledot", 0x2299 }, /* CIRCLED DOT OPERATOR */
00591     { "$circlelarge", 0x25EF }, /* LARGE CIRCLE */
00592     { "$circleminus", 0x2296 }, /* CIRCLED MINUS */
00593     { "$circumflexcomb", 0x0302 }, /* COMBINING CIRCUMFLEX ACCENT */
00594     { "$contintegral", 0x222E }, /* CONTOUR INTEGRAL */
00595     { "$coproduct", 0x2210 }, /* N-ARY COPRODUCT */
00596     { "$diamondmath", 0x22C4 }, /* DIAMOND OPERATOR */
00597     { "$dieresiscomb", 0x0308 }, /* COMBINING DIAERESIS */
00598     { "$divisionslash", 0x2215 }, /* DIVISION SLASH; distinguish Adobe duplicates */
00599     { "$dotaccentcomb", 0x0307 }, /* COMBINING DOT ABOVE */
00600     { "$epsilon1", 0x03F5 }, /* GREEK LUNATE EPSILON SYMBOL */
00601     { "$equivasymptotic", 0x224D }, /* EQUIVALENT TO */
00602     { "$flat", 0x266D }, /* MUSIC FLAT SIGN */
00603     { "$floorleft", 0x230A }, /* LEFT FLOOR */
00604     { "$floorright", 0x230B }, /* RIGHT FLOOR */
00605     { "$follows", 0x227B }, /* SUCCEEDS */
00606     { "$followsequal", 0x227D }, /* SUCCEEDS OR EQUAL TO */
00607     { "$fractionslash", 0x2044 }, /* FRACTION SLASH; distinguish Adobe duplicates */
00608     { "$frown", 0x2322 }, /* FROWN */
00609     { "$gravemodifier", 0x02CB }, /* MODIFIER LETTER GRAVE ACCENT */
00610     { "$greatermuch", 0x226B }, /* MUCH GREATER-THAN */
00611     { "$harpoonleftbarbdown", 0x21BD }, /* LEFTWARDS HARPOON WITH BARB DOWNWARDS */
00612     { "$harpoonleftbarbup", 0x21BC }, /* LEFTWARDS HARPOON WITH BARB UPWARDS */
00613     { "$harpoonrightbarbdown", 0x21C1 }, /* RIGHTWARDS HARPOON WITH BARB DOWNWARDS */
00614     { "$harpoonrightbarbup", 0x21C0 }, /* RIGHTWARDS HARPOON WITH BARB UPWARDS */
00615     { "$hyphen" , 0x002D }, /* HYPHEN-MINUS; distinguish Adobe duplicates */
00616     { "$hyphensoft" , 0x00AD }, /* SOFT HYPHEN; distinguish Adobe duplicates */
00617     { "$increment" , 0x2206 }, /* INCREMENT; distinguish Adobe duplicates */
00618     { "$intersectionsq", 0x2293 }, /* SQUARE CAP */
00619     { "$latticetop", 0x22A4 }, /* DOWN TACK */
00620     { "$lessmuch", 0x226A }, /* MUCH-LESS THAN */
00621     { "$longst", 0xFB05 }, /* LATIN SMALL LIGATURE LONG S T */
00622     { "$lscript", 0x2113 }, /* SCRIPT SMALL L; Adobe has this as "afii61289" */
00623     { "$macron", 0x00AF }, /* MACRON; distinguish Adobe duplicates */
00624     { "$macroncomb", 0x0304 }, /* COMBINING MACRON */
00625     { "$macronmodifier", 0x02C9 }, /* MODIFIER LETTER MACRON */
00626     { "$micro", 0x00B5 }, /* MICRO SIGN; distinguish Adobe duplicates */
00627     { "$minusplus", 0x2213 }, /* MINUS-OR-PLUS SIGN */
00628     { "$mu", 0x03BC }, /* GREEK SMALL LETTER MU; distinguish Adobe duplicates */
00629     { "$natural", 0x266E }, /* MUSIC NATURAL SIGN */
00630     { "$normalin", 0x22B2 }, /* NORMAL SUBGROUP OF */
00631     { "$normalizes", 0x22B3 }, /* CONTAINS AS NORMAL SUBGROUP */
00632     { "$ogonekcomb", 0x0328 }, /* COMBINING OGONEK */
00633     { "$overlinecomb", 0x0305 }, /* COMBINING OVERLINE */
00634     { "$parallel", 0x2225 }, /* PARALLEL TO */
00635     { "$periodcentered" , 0x00B7 }, /* MIDDLE DOT; distinguish Adobe duplicates */
00636     { "$pi1", 0x03D6 }, /* GREEK PI SYMBOL; Adobe has this as "omega1" which is too confusing */
00637     { "$precedes", 0x227A }, /* PRECEDES */
00638     { "$precedesequal", 0x227C }, /* PRECEDES OR EQUAL TO */
00639     { "$quotedblreversed", 0x201F }, /* DOUBLE HIGH-REVERSED-9 QUOTATION MARK */
00640     { "$reflexnormalin", 0x22B4 }, /* NORMAL SUBGROUP OF OR EQUAL TO */
00641     { "$reflexnormalizes", 0x22B5 }, /* CONTAINS AS NORMAL SUBGROUP OR EQUAL TO */
00642     { "$reflexsubsetsq", 0x2291 }, /* SQUARE IMAGE OF OR EQUAL TO */
00643     { "$reflexsupersetsq", 0x2292 }, /* SQUARE ORIGINAL OF OR EQUAL TO */
00644     { "$rho1", 0x03F1 }, /* GREEK RHO SYMBOL */
00645     { "$ringcomb", 0x030A }, /* COMBINING RING ABOVE */
00646     { "$scedilla" , 0x015F }, /* LATIN SMALL LETTER S WITH CEDILLA; distinguish Adobe duplicates */
00647     { "$sharp", 0x266F }, /* MUSIC SHARP SIGN */
00648     { "$similarequal", 0x2243 }, /* ASYMPTOTICALLY EQUAL TO */
00649     { "$slashlongcomb", 0x0338 }, /* COMBINING LONG SOLIDUS OVERLAY */
00650     { "$smile", 0x2323 }, /* SMILE */
00651     { "$space" , 0x0020 }, /* SPACE; distinguish Adobe duplicates */
00652     { "$spacenobreak" , 0x00A0 }, /* NO-BREAK SPACE; distinguish Adobe duplicates */
00653     { "$spacesymbol", 0x2420 }, /* SYMBOL FOR SPACE */
00654     { "$st", 0xFB06 }, /* LATIN SMALL LIGATURE ST */
00655     { "$starmath", 0x22C6 }, /* STAR OPERATOR */
00656     { "$tcedilla", 0x0163 }, /* LATIN SMALL LETTER T WITH CEDILLA; distinguish Adobe duplicates */
00657     { "$tcommaaccent", 0x021B }, /* LATIN SMALL LETTER T WITH COMMA BELOW; distinguish Adobe duplicates */
00658     { "$tie", 0x2040 }, /* CHARACTER TIE */
00659     { "$triagwhitedn", 0x25BD }, /* WHITE DOWN-POINTING TRIANGLE */
00660     { "$triagwhiteup", 0x25B3 }, /* WHITE UP-POINTING TRIANGLE */
00661     { "$turnstileleft", 0x22A2 }, /* RIGHT TACK */
00662     { "$turnstileright", 0x22A3 }, /* LEFT TACK */
00663     { "$unionmulti", 0x228E }, /* MULTISET UNION */
00664     { "$unionsq", 0x2294 }, /* SQUARE CUP */
00665     { "$vectorcomb", 0x20D7 }, /* COMBINING RIGHT ARROW ABOVE */
00666     { "$wreathproduct", 0x2240 }, /* WREATH PRODUCT */
00667     { ".notdef", 0 }, /* was: QUESTION MARK; changed to 0 */
00668     { "A", 0x0041 }, /* LATIN CAPITAL LETTER A */
00669     { "AE", 0x00C6 }, /* LATIN CAPITAL LETTER AE */
00670     { "AEacute", 0x01FC }, /* LATIN CAPITAL LETTER AE WITH ACUTE */
00671     { "AEsmall", 0xF7E6 }, /* LATIN SMALL CAPITAL LETTER AE */
00672     { "Aacute", 0x00C1 }, /* LATIN CAPITAL LETTER A WITH ACUTE */
00673     { "Aacutesmall", 0xF7E1 }, /* LATIN SMALL CAPITAL LETTER A WITH ACUTE */
00674     { "Abreve", 0x0102 }, /* LATIN CAPITAL LETTER A WITH BREVE */
00675     { "Acircumflex", 0x00C2 }, /* LATIN CAPITAL LETTER A WITH CIRCUMFLEX */
00676     { "Acircumflexsmall", 0xF7E2 }, /* LATIN SMALL CAPITAL LETTER A WITH CIRCUMFLEX */
00677     { "Acute", 0xF6C9 }, /* CAPITAL ACUTE ACCENT */
00678     { "Acutesmall", 0xF7B4 }, /* SMALL CAPITAL ACUTE ACCENT */
00679     { "Adieresis", 0x00C4 }, /* LATIN CAPITAL LETTER A WITH DIAERESIS */
00680     { "Adieresissmall", 0xF7E4 }, /* LATIN SMALL CAPITAL LETTER A WITH DIAERESIS */
00681     { "Agrave", 0x00C0 }, /* LATIN CAPITAL LETTER A WITH GRAVE */
00682     { "Agravesmall", 0xF7E0 }, /* LATIN SMALL CAPITAL LETTER A WITH GRAVE */
00683     { "Alpha", 0x0391 }, /* GREEK CAPITAL LETTER ALPHA */
00684     { "Alphatonos", 0x0386 }, /* GREEK CAPITAL LETTER ALPHA WITH TONOS */
00685     { "Amacron", 0x0100 }, /* LATIN CAPITAL LETTER A WITH MACRON */
00686     { "Aogonek", 0x0104 }, /* LATIN CAPITAL LETTER A WITH OGONEK */
00687     { "Aring", 0x00C5 }, /* LATIN CAPITAL LETTER A WITH RING ABOVE */
00688     { "Aringacute", 0x01FA }, /* LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE */
00689     { "Aringsmall", 0xF7E5 }, /* LATIN SMALL CAPITAL LETTER A WITH RING ABOVE */
00690     { "Asmall", 0xF761 }, /* LATIN SMALL CAPITAL LETTER A */
00691     { "Atilde", 0x00C3 }, /* LATIN CAPITAL LETTER A WITH TILDE */
00692     { "Atildesmall", 0xF7E3 }, /* LATIN SMALL CAPITAL LETTER A WITH TILDE */
00693     { "B", 0x0042 }, /* LATIN CAPITAL LETTER B */
00694     { "Beta", 0x0392 }, /* GREEK CAPITAL LETTER BETA */
00695     { "Brevesmall", 0xF6F4 }, /* SMALL CAPITAL BREVE */
00696     { "Bsmall", 0xF762 }, /* LATIN SMALL CAPITAL LETTER B */
00697     { "C", 0x0043 }, /* LATIN CAPITAL LETTER C */
00698     { "Cacute", 0x0106 }, /* LATIN CAPITAL LETTER C WITH ACUTE */
00699     { "Caron", 0xF6CA }, /* CAPITAL CARON */
00700     { "Caronsmall", 0xF6F5 }, /* SMALL CAPITAL CARON */
00701     { "Ccaron", 0x010C }, /* LATIN CAPITAL LETTER C WITH CARON */
00702     { "Ccedilla", 0x00C7 }, /* LATIN CAPITAL LETTER C WITH CEDILLA */
00703     { "Ccedillasmall", 0xF7E7 }, /* LATIN SMALL CAPITAL LETTER C WITH CEDILLA */
00704     { "Ccircumflex", 0x0108 }, /* LATIN CAPITAL LETTER C WITH CIRCUMFLEX */
00705     { "Cdotaccent", 0x010A }, /* LATIN CAPITAL LETTER C WITH DOT ABOVE */
00706     { "Cedillasmall", 0xF7B8 }, /* SMALL CAPITAL CEDILLA */
00707     { "Chi", 0x03A7 }, /* GREEK CAPITAL LETTER CHI */
00708     { "Circumflexsmall", 0xF6F6 }, /* SMALL CAPITAL MODIFIER LETTER CIRCUMFLEX ACCENT */
00709     { "Csmall", 0xF763 }, /* LATIN SMALL CAPITAL LETTER C */
00710     { "D", 0x0044 }, /* LATIN CAPITAL LETTER D */
00711     { "Dcaron", 0x010E }, /* LATIN CAPITAL LETTER D WITH CARON */
00712     { "Dcroat", 0x0110 }, /* LATIN CAPITAL LETTER D WITH STROKE */
00713     { "Delta", 0x2206 }, /* INCREMENT */
00714 #if 0
00715     { "Delta" DUP2, 0x0394 }, /* GREEK CAPITAL LETTER DELTA;Duplicate */
00716 #endif /* 0 */
00717     { "Dieresis", 0xF6CB }, /* CAPITAL DIAERESIS */
00718     { "DieresisAcute", 0xF6CC }, /* CAPITAL DIAERESIS ACUTE ACCENT */
00719     { "DieresisGrave", 0xF6CD }, /* CAPITAL DIAERESIS GRAVE ACCENT */
00720     { "Dieresissmall", 0xF7A8 }, /* SMALL CAPITAL DIAERESIS */
00721     { "Dotaccentsmall", 0xF6F7 }, /* SMALL CAPITAL DOT ABOVE */
00722     { "Dsmall", 0xF764 }, /* LATIN SMALL CAPITAL LETTER D */
00723     { "E", 0x0045 }, /* LATIN CAPITAL LETTER E */
00724     { "Eacute", 0x00C9 }, /* LATIN CAPITAL LETTER E WITH ACUTE */
00725     { "Eacutesmall", 0xF7E9 }, /* LATIN SMALL CAPITAL LETTER E WITH ACUTE */
00726     { "Ebreve", 0x0114 }, /* LATIN CAPITAL LETTER E WITH BREVE */
00727     { "Ecaron", 0x011A }, /* LATIN CAPITAL LETTER E WITH CARON */
00728     { "Ecircumflex", 0x00CA }, /* LATIN CAPITAL LETTER E WITH CIRCUMFLEX */
00729     { "Ecircumflexsmall", 0xF7EA }, /* LATIN SMALL CAPITAL LETTER E WITH CIRCUMFLEX */
00730     { "Edieresis", 0x00CB }, /* LATIN CAPITAL LETTER E WITH DIAERESIS */
00731     { "Edieresissmall", 0xF7EB }, /* LATIN SMALL CAPITAL LETTER E WITH DIAERESIS */
00732     { "Edotaccent", 0x0116 }, /* LATIN CAPITAL LETTER E WITH DOT ABOVE */
00733     { "Egrave", 0x00C8 }, /* LATIN CAPITAL LETTER E WITH GRAVE */
00734     { "Egravesmall", 0xF7E8 }, /* LATIN SMALL CAPITAL LETTER E WITH GRAVE */
00735     { "Emacron", 0x0112 }, /* LATIN CAPITAL LETTER E WITH MACRON */
00736     { "Eng", 0x014A }, /* LATIN CAPITAL LETTER ENG */
00737     { "Eogonek", 0x0118 }, /* LATIN CAPITAL LETTER E WITH OGONEK */
00738     { "Epsilon", 0x0395 }, /* GREEK CAPITAL LETTER EPSILON */
00739     { "Epsilontonos", 0x0388 }, /* GREEK CAPITAL LETTER EPSILON WITH TONOS */
00740     { "Esmall", 0xF765 }, /* LATIN SMALL CAPITAL LETTER E */
00741     { "Eta", 0x0397 }, /* GREEK CAPITAL LETTER ETA */
00742     { "Etatonos", 0x0389 }, /* GREEK CAPITAL LETTER ETA WITH TONOS */
00743     { "Eth", 0x00D0 }, /* LATIN CAPITAL LETTER ETH */
00744     { "Ethsmall", 0xF7F0 }, /* LATIN SMALL CAPITAL LETTER ETH */
00745     { "Euro", 0x20AC }, /* EURO SIGN */
00746     { "F", 0x0046 }, /* LATIN CAPITAL LETTER F */
00747     { "Fsmall", 0xF766 }, /* LATIN SMALL CAPITAL LETTER F */
00748     { "G", 0x0047 }, /* LATIN CAPITAL LETTER G */
00749     { "Gamma", 0x0393 }, /* GREEK CAPITAL LETTER GAMMA */
00750     { "Gbreve", 0x011E }, /* LATIN CAPITAL LETTER G WITH BREVE */
00751     { "Gcaron", 0x01E6 }, /* LATIN CAPITAL LETTER G WITH CARON */
00752     { "Gcircumflex", 0x011C }, /* LATIN CAPITAL LETTER G WITH CIRCUMFLEX */
00753     { "Gcommaaccent", 0x0122 }, /* LATIN CAPITAL LETTER G WITH CEDILLA */
00754     { "Gdotaccent", 0x0120 }, /* LATIN CAPITAL LETTER G WITH DOT ABOVE */
00755     { "Grave", 0xF6CE }, /* CAPITAL GRAVE ACCENT */
00756     { "Gravesmall", 0xF760 }, /* SMALL CAPITAL GRAVE ACCENT */
00757     { "Gsmall", 0xF767 }, /* LATIN SMALL CAPITAL LETTER G */
00758     { "H", 0x0048 }, /* LATIN CAPITAL LETTER H */
00759     { "H18533", 0x25CF }, /* BLACK CIRCLE */
00760     { "H18543", 0x25AA }, /* BLACK SMALL SQUARE */
00761     { "H18551", 0x25AB }, /* WHITE SMALL SQUARE */
00762     { "H22073", 0x25A1 }, /* WHITE SQUARE */
00763     { "Hbar", 0x0126 }, /* LATIN CAPITAL LETTER H WITH STROKE */
00764     { "Hcircumflex", 0x0124 }, /* LATIN CAPITAL LETTER H WITH CIRCUMFLEX */
00765     { "Hsmall", 0xF768 }, /* LATIN SMALL CAPITAL LETTER H */
00766     { "Hungarumlaut", 0xF6CF }, /* CAPITAL DOUBLE ACUTE ACCENT */
00767     { "Hungarumlautsmall", 0xF6F8 }, /* SMALL CAPITAL DOUBLE ACUTE ACCENT */
00768     { "I", 0x0049 }, /* LATIN CAPITAL LETTER I */
00769     { "IJ", 0x0132 }, /* LATIN CAPITAL LIGATURE IJ */
00770     { "Iacute", 0x00CD }, /* LATIN CAPITAL LETTER I WITH ACUTE */
00771     { "Iacutesmall", 0xF7ED }, /* LATIN SMALL CAPITAL LETTER I WITH ACUTE */
00772     { "Ibreve", 0x012C }, /* LATIN CAPITAL LETTER I WITH BREVE */
00773     { "Icircumflex", 0x00CE }, /* LATIN CAPITAL LETTER I WITH CIRCUMFLEX */
00774     { "Icircumflexsmall", 0xF7EE }, /* LATIN SMALL CAPITAL LETTER I WITH CIRCUMFLEX */
00775     { "Idieresis", 0x00CF }, /* LATIN CAPITAL LETTER I WITH DIAERESIS */
00776     { "Idieresissmall", 0xF7EF }, /* LATIN SMALL CAPITAL LETTER I WITH DIAERESIS */
00777     { "Idotaccent", 0x0130 }, /* LATIN CAPITAL LETTER I WITH DOT ABOVE */
00778     { "Ifraktur", 0x2111 }, /* BLACK-LETTER CAPITAL I */
00779     { "Igrave", 0x00CC }, /* LATIN CAPITAL LETTER I WITH GRAVE */
00780     { "Igravesmall", 0xF7EC }, /* LATIN SMALL CAPITAL LETTER I WITH GRAVE */
00781     { "Imacron", 0x012A }, /* LATIN CAPITAL LETTER I WITH MACRON */
00782     { "Iogonek", 0x012E }, /* LATIN CAPITAL LETTER I WITH OGONEK */
00783     { "Iota", 0x0399 }, /* GREEK CAPITAL LETTER IOTA */
00784     { "Iotadieresis", 0x03AA }, /* GREEK CAPITAL LETTER IOTA WITH DIALYTIKA */
00785     { "Iotatonos", 0x038A }, /* GREEK CAPITAL LETTER IOTA WITH TONOS */
00786     { "Ismall", 0xF769 }, /* LATIN SMALL CAPITAL LETTER I */
00787     { "Itilde", 0x0128 }, /* LATIN CAPITAL LETTER I WITH TILDE */
00788     { "J", 0x004A }, /* LATIN CAPITAL LETTER J */
00789     { "Jcircumflex", 0x0134 }, /* LATIN CAPITAL LETTER J WITH CIRCUMFLEX */
00790     { "Jsmall", 0xF76A }, /* LATIN SMALL CAPITAL LETTER J */
00791     { "K", 0x004B }, /* LATIN CAPITAL LETTER K */
00792     { "Kappa", 0x039A }, /* GREEK CAPITAL LETTER KAPPA */
00793     { "Kcommaaccent", 0x0136 }, /* LATIN CAPITAL LETTER K WITH CEDILLA */
00794     { "Ksmall", 0xF76B }, /* LATIN SMALL CAPITAL LETTER K */
00795     { "L", 0x004C }, /* LATIN CAPITAL LETTER L */
00796     { "LL", 0xF6BF }, /* LATIN CAPITAL LETTER LL */
00797     { "Lacute", 0x0139 }, /* LATIN CAPITAL LETTER L WITH ACUTE */
00798     { "Lambda", 0x039B }, /* GREEK CAPITAL LETTER LAMDA */
00799     { "Lcaron", 0x013D }, /* LATIN CAPITAL LETTER L WITH CARON */
00800     { "Lcommaaccent", 0x013B }, /* LATIN CAPITAL LETTER L WITH CEDILLA */
00801     { "Ldot", 0x013F }, /* LATIN CAPITAL LETTER L WITH MIDDLE DOT */
00802     { "Lslash", 0x0141 }, /* LATIN CAPITAL LETTER L WITH STROKE */
00803     { "Lslashsmall", 0xF6F9 }, /* LATIN SMALL CAPITAL LETTER L WITH STROKE */
00804     { "Lsmall", 0xF76C }, /* LATIN SMALL CAPITAL LETTER L */
00805     { "M", 0x004D }, /* LATIN CAPITAL LETTER M */
00806     { "Macron", 0xF6D0 }, /* CAPITAL MACRON */
00807     { "Macronsmall", 0xF7AF }, /* SMALL CAPITAL MACRON */
00808     { "Msmall", 0xF76D }, /* LATIN SMALL CAPITAL LETTER M */
00809     { "Mu", 0x039C }, /* GREEK CAPITAL LETTER MU */
00810     { "N", 0x004E }, /* LATIN CAPITAL LETTER N */
00811     { "Nacute", 0x0143 }, /* LATIN CAPITAL LETTER N WITH ACUTE */
00812     { "Ncaron", 0x0147 }, /* LATIN CAPITAL LETTER N WITH CARON */
00813     { "Ncommaaccent", 0x0145 }, /* LATIN CAPITAL LETTER N WITH CEDILLA */
00814     { "Nsmall", 0xF76E }, /* LATIN SMALL CAPITAL LETTER N */
00815     { "Ntilde", 0x00D1 }, /* LATIN CAPITAL LETTER N WITH TILDE */
00816     { "Ntildesmall", 0xF7F1 }, /* LATIN SMALL CAPITAL LETTER N WITH TILDE */
00817     { "Nu", 0x039D }, /* GREEK CAPITAL LETTER NU */
00818     { "O", 0x004F }, /* LATIN CAPITAL LETTER O */
00819     { "OE", 0x0152 }, /* LATIN CAPITAL LIGATURE OE */
00820     { "OEsmall", 0xF6FA }, /* LATIN SMALL CAPITAL LIGATURE OE */
00821     { "Oacute", 0x00D3 }, /* LATIN CAPITAL LETTER O WITH ACUTE */
00822     { "Oacutesmall", 0xF7F3 }, /* LATIN SMALL CAPITAL LETTER O WITH ACUTE */
00823     { "Obreve", 0x014E }, /* LATIN CAPITAL LETTER O WITH BREVE */
00824     { "Ocircumflex", 0x00D4 }, /* LATIN CAPITAL LETTER O WITH CIRCUMFLEX */
00825     { "Ocircumflexsmall", 0xF7F4 }, /* LATIN SMALL CAPITAL LETTER O WITH CIRCUMFLEX */
00826     { "Odieresis", 0x00D6 }, /* LATIN CAPITAL LETTER O WITH DIAERESIS */
00827     { "Odieresissmall", 0xF7F6 }, /* LATIN SMALL CAPITAL LETTER O WITH DIAERESIS */
00828     { "Ogoneksmall", 0xF6FB }, /* SMALL CAPITAL OGONEK */
00829     { "Ograve", 0x00D2 }, /* LATIN CAPITAL LETTER O WITH GRAVE */
00830     { "Ogravesmall", 0xF7F2 }, /* LATIN SMALL CAPITAL LETTER O WITH GRAVE */
00831     { "Ohorn", 0x01A0 }, /* LATIN CAPITAL LETTER O WITH HORN */
00832     { "Ohungarumlaut", 0x0150 }, /* LATIN CAPITAL LETTER O WITH DOUBLE ACUTE */
00833     { "Omacron", 0x014C }, /* LATIN CAPITAL LETTER O WITH MACRON */
00834     { "Omega", 0x2126 }, /* OHM SIGN */
00835 #if 0
00836     { "Omega" DUP2, 0x03A9 }, /* GREEK CAPITAL LETTER OMEGA;Duplicate */
00837 #endif /* 0 */
00838     { "Omegatonos", 0x038F }, /* GREEK CAPITAL LETTER OMEGA WITH TONOS */
00839     { "Omicron", 0x039F }, /* GREEK CAPITAL LETTER OMICRON */
00840     { "Omicrontonos", 0x038C }, /* GREEK CAPITAL LETTER OMICRON WITH TONOS */
00841     { "Oslash", 0x00D8 }, /* LATIN CAPITAL LETTER O WITH STROKE */
00842     { "Oslashacute", 0x01FE }, /* LATIN CAPITAL LETTER O WITH STROKE AND ACUTE */
00843     { "Oslashsmall", 0xF7F8 }, /* LATIN SMALL CAPITAL LETTER O WITH STROKE */
00844     { "Osmall", 0xF76F }, /* LATIN SMALL CAPITAL LETTER O */
00845     { "Otilde", 0x00D5 }, /* LATIN CAPITAL LETTER O WITH TILDE */
00846     { "Otildesmall", 0xF7F5 }, /* LATIN SMALL CAPITAL LETTER O WITH TILDE */
00847     { "P", 0x0050 }, /* LATIN CAPITAL LETTER P */
00848     { "Phi", 0x03A6 }, /* GREEK CAPITAL LETTER PHI */
00849     { "Pi", 0x03A0 }, /* GREEK CAPITAL LETTER PI */
00850     { "Psi", 0x03A8 }, /* GREEK CAPITAL LETTER PSI */
00851     { "Psmall", 0xF770 }, /* LATIN SMALL CAPITAL LETTER P */
00852     { "Q", 0x0051 }, /* LATIN CAPITAL LETTER Q */
00853     { "Qsmall", 0xF771 }, /* LATIN SMALL CAPITAL LETTER Q */
00854     { "R", 0x0052 }, /* LATIN CAPITAL LETTER R */
00855     { "Racute", 0x0154 }, /* LATIN CAPITAL LETTER R WITH ACUTE */
00856     { "Rcaron", 0x0158 }, /* LATIN CAPITAL LETTER R WITH CARON */
00857     { "Rcommaaccent", 0x0156 }, /* LATIN CAPITAL LETTER R WITH CEDILLA */
00858     { "Rfraktur", 0x211C }, /* BLACK-LETTER CAPITAL R */
00859     { "Rho", 0x03A1 }, /* GREEK CAPITAL LETTER RHO */
00860     { "Ringsmall", 0xF6FC }, /* SMALL CAPITAL RING ABOVE */
00861     { "Rsmall", 0xF772 }, /* LATIN SMALL CAPITAL LETTER R */
00862     { "S", 0x0053 }, /* LATIN CAPITAL LETTER S */
00863     { "SF010000", 0x250C }, /* BOX DRAWINGS LIGHT DOWN AND RIGHT */
00864     { "SF020000", 0x2514 }, /* BOX DRAWINGS LIGHT UP AND RIGHT */
00865     { "SF030000", 0x2510 }, /* BOX DRAWINGS LIGHT DOWN AND LEFT */
00866     { "SF040000", 0x2518 }, /* BOX DRAWINGS LIGHT UP AND LEFT */
00867     { "SF050000", 0x253C }, /* BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL */
00868     { "SF060000", 0x252C }, /* BOX DRAWINGS LIGHT DOWN AND HORIZONTAL */
00869     { "SF070000", 0x2534 }, /* BOX DRAWINGS LIGHT UP AND HORIZONTAL */
00870     { "SF080000", 0x251C }, /* BOX DRAWINGS LIGHT VERTICAL AND RIGHT */
00871     { "SF090000", 0x2524 }, /* BOX DRAWINGS LIGHT VERTICAL AND LEFT */
00872     { "SF100000", 0x2500 }, /* BOX DRAWINGS LIGHT HORIZONTAL */
00873     { "SF110000", 0x2502 }, /* BOX DRAWINGS LIGHT VERTICAL */
00874     { "SF190000", 0x2561 }, /* BOX DRAWINGS VERTICAL SINGLE AND LEFT DOUBLE */
00875     { "SF200000", 0x2562 }, /* BOX DRAWINGS VERTICAL DOUBLE AND LEFT SINGLE */
00876     { "SF210000", 0x2556 }, /* BOX DRAWINGS DOWN DOUBLE AND LEFT SINGLE */
00877     { "SF220000", 0x2555 }, /* BOX DRAWINGS DOWN SINGLE AND LEFT DOUBLE */
00878     { "SF230000", 0x2563 }, /* BOX DRAWINGS DOUBLE VERTICAL AND LEFT */
00879     { "SF240000", 0x2551 }, /* BOX DRAWINGS DOUBLE VERTICAL */
00880     { "SF250000", 0x2557 }, /* BOX DRAWINGS DOUBLE DOWN AND LEFT */
00881     { "SF260000", 0x255D }, /* BOX DRAWINGS DOUBLE UP AND LEFT */
00882     { "SF270000", 0x255C }, /* BOX DRAWINGS UP DOUBLE AND LEFT SINGLE */
00883     { "SF280000", 0x255B }, /* BOX DRAWINGS UP SINGLE AND LEFT DOUBLE */
00884     { "SF360000", 0x255E }, /* BOX DRAWINGS VERTICAL SINGLE AND RIGHT DOUBLE */
00885     { "SF370000", 0x255F }, /* BOX DRAWINGS VERTICAL DOUBLE AND RIGHT SINGLE */
00886     { "SF380000", 0x255A }, /* BOX DRAWINGS DOUBLE UP AND RIGHT */
00887     { "SF390000", 0x2554 }, /* BOX DRAWINGS DOUBLE DOWN AND RIGHT */
00888     { "SF400000", 0x2569 }, /* BOX DRAWINGS DOUBLE UP AND HORIZONTAL */
00889     { "SF410000", 0x2566 }, /* BOX DRAWINGS DOUBLE DOWN AND HORIZONTAL */
00890     { "SF420000", 0x2560 }, /* BOX DRAWINGS DOUBLE VERTICAL AND RIGHT */
00891     { "SF430000", 0x2550 }, /* BOX DRAWINGS DOUBLE HORIZONTAL */
00892     { "SF440000", 0x256C }, /* BOX DRAWINGS DOUBLE VERTICAL AND HORIZONTAL */
00893     { "SF450000", 0x2567 }, /* BOX DRAWINGS UP SINGLE AND HORIZONTAL DOUBLE */
00894     { "SF460000", 0x2568 }, /* BOX DRAWINGS UP DOUBLE AND HORIZONTAL SINGLE */
00895     { "SF470000", 0x2564 }, /* BOX DRAWINGS DOWN SINGLE AND HORIZONTAL DOUBLE */
00896     { "SF480000", 0x2565 }, /* BOX DRAWINGS DOWN DOUBLE AND HORIZONTAL SINGLE */
00897     { "SF490000", 0x2559 }, /* BOX DRAWINGS UP DOUBLE AND RIGHT SINGLE */
00898     { "SF500000", 0x2558 }, /* BOX DRAWINGS UP SINGLE AND RIGHT DOUBLE */
00899     { "SF510000", 0x2552 }, /* BOX DRAWINGS DOWN SINGLE AND RIGHT DOUBLE */
00900     { "SF520000", 0x2553 }, /* BOX DRAWINGS DOWN DOUBLE AND RIGHT SINGLE */
00901     { "SF530000", 0x256B }, /* BOX DRAWINGS VERTICAL DOUBLE AND HORIZONTAL SINGLE */
00902     { "SF540000", 0x256A }, /* BOX DRAWINGS VERTICAL SINGLE AND HORIZONTAL DOUBLE */
00903     { "Sacute", 0x015A }, /* LATIN CAPITAL LETTER S WITH ACUTE */
00904     { "Scaron", 0x0160 }, /* LATIN CAPITAL LETTER S WITH CARON */
00905     { "Scaronsmall", 0xF6FD }, /* LATIN SMALL CAPITAL LETTER S WITH CARON */
00906     { "Scedilla", 0x015E }, /* LATIN CAPITAL LETTER S WITH CEDILLA */
00907 #if 0
00908     { "Scedilla" DUP2, 0xF6C1 }, /* LATIN CAPITAL LETTER S WITH CEDILLA;Duplicate */
00909 #endif /* 0 */
00910     { "Scircumflex", 0x015C }, /* LATIN CAPITAL LETTER S WITH CIRCUMFLEX */
00911     { "Scommaaccent", 0x0218 }, /* LATIN CAPITAL LETTER S WITH COMMA BELOW */
00912     { "Sigma", 0x03A3 }, /* GREEK CAPITAL LETTER SIGMA */
00913     { "Ssmall", 0xF773 }, /* LATIN SMALL CAPITAL LETTER S */
00914     { "T", 0x0054 }, /* LATIN CAPITAL LETTER T */
00915     { "Tau", 0x03A4 }, /* GREEK CAPITAL LETTER TAU */
00916     { "Tbar", 0x0166 }, /* LATIN CAPITAL LETTER T WITH STROKE */
00917     { "Tcaron", 0x0164 }, /* LATIN CAPITAL LETTER T WITH CARON */
00918     { "Tcommaaccent", 0x0162 }, /* LATIN CAPITAL LETTER T WITH CEDILLA */
00919 #if 0
00920     { "Tcommaaccent" DUP2, 0x021A }, /* LATIN CAPITAL LETTER T WITH COMMA BELOW;Duplicate */
00921 #endif /* 0 */
00922     { "Theta", 0x0398 }, /* GREEK CAPITAL LETTER THETA */
00923     { "Thorn", 0x00DE }, /* LATIN CAPITAL LETTER THORN */
00924     { "Thornsmall", 0xF7FE }, /* LATIN SMALL CAPITAL LETTER THORN */
00925     { "Tildesmall", 0xF6FE }, /* SMALL CAPITAL SMALL TILDE */
00926     { "Tsmall", 0xF774 }, /* LATIN SMALL CAPITAL LETTER T */
00927     { "U", 0x0055 }, /* LATIN CAPITAL LETTER U */
00928     { "Uacute", 0x00DA }, /* LATIN CAPITAL LETTER U WITH ACUTE */
00929     { "Uacutesmall", 0xF7FA }, /* LATIN SMALL CAPITAL LETTER U WITH ACUTE */
00930     { "Ubreve", 0x016C }, /* LATIN CAPITAL LETTER U WITH BREVE */
00931     { "Ucircumflex", 0x00DB }, /* LATIN CAPITAL LETTER U WITH CIRCUMFLEX */
00932     { "Ucircumflexsmall", 0xF7FB }, /* LATIN SMALL CAPITAL LETTER U WITH CIRCUMFLEX */
00933     { "Udieresis", 0x00DC }, /* LATIN CAPITAL LETTER U WITH DIAERESIS */
00934     { "Udieresissmall", 0xF7FC }, /* LATIN SMALL CAPITAL LETTER U WITH DIAERESIS */
00935     { "Ugrave", 0x00D9 }, /* LATIN CAPITAL LETTER U WITH GRAVE */
00936     { "Ugravesmall", 0xF7F9 }, /* LATIN SMALL CAPITAL LETTER U WITH GRAVE */
00937     { "Uhorn", 0x01AF }, /* LATIN CAPITAL LETTER U WITH HORN */
00938     { "Uhungarumlaut", 0x0170 }, /* LATIN CAPITAL LETTER U WITH DOUBLE ACUTE */
00939     { "Umacron", 0x016A }, /* LATIN CAPITAL LETTER U WITH MACRON */
00940     { "Uogonek", 0x0172 }, /* LATIN CAPITAL LETTER U WITH OGONEK */
00941     { "Upsilon", 0x03A5 }, /* GREEK CAPITAL LETTER UPSILON */
00942     { "Upsilon1", 0x03D2 }, /* GREEK UPSILON WITH HOOK SYMBOL */
00943     { "Upsilondieresis", 0x03AB }, /* GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA */
00944     { "Upsilontonos", 0x038E }, /* GREEK CAPITAL LETTER UPSILON WITH TONOS */
00945     { "Uring", 0x016E }, /* LATIN CAPITAL LETTER U WITH RING ABOVE */
00946     { "Usmall", 0xF775 }, /* LATIN SMALL CAPITAL LETTER U */
00947     { "Utilde", 0x0168 }, /* LATIN CAPITAL LETTER U WITH TILDE */
00948     { "V", 0x0056 }, /* LATIN CAPITAL LETTER V */
00949     { "Vsmall", 0xF776 }, /* LATIN SMALL CAPITAL LETTER V */
00950     { "W", 0x0057 }, /* LATIN CAPITAL LETTER W */
00951     { "Wacute", 0x1E82 }, /* LATIN CAPITAL LETTER W WITH ACUTE */
00952     { "Wcircumflex", 0x0174 }, /* LATIN CAPITAL LETTER W WITH CIRCUMFLEX */
00953     { "Wdieresis", 0x1E84 }, /* LATIN CAPITAL LETTER W WITH DIAERESIS */
00954     { "Wgrave", 0x1E80 }, /* LATIN CAPITAL LETTER W WITH GRAVE */
00955     { "Wsmall", 0xF777 }, /* LATIN SMALL CAPITAL LETTER W */
00956     { "X", 0x0058 }, /* LATIN CAPITAL LETTER X */
00957     { "Xi", 0x039E }, /* GREEK CAPITAL LETTER XI */
00958     { "Xsmall", 0xF778 }, /* LATIN SMALL CAPITAL LETTER X */
00959     { "Y", 0x0059 }, /* LATIN CAPITAL LETTER Y */
00960     { "Yacute", 0x00DD }, /* LATIN CAPITAL LETTER Y WITH ACUTE */
00961     { "Yacutesmall", 0xF7FD }, /* LATIN SMALL CAPITAL LETTER Y WITH ACUTE */
00962     { "Ycircumflex", 0x0176 }, /* LATIN CAPITAL LETTER Y WITH CIRCUMFLEX */
00963     { "Ydieresis", 0x0178 }, /* LATIN CAPITAL LETTER Y WITH DIAERESIS */
00964     { "Ydieresissmall", 0xF7FF }, /* LATIN SMALL CAPITAL LETTER Y WITH DIAERESIS */
00965     { "Ygrave", 0x1EF2 }, /* LATIN CAPITAL LETTER Y WITH GRAVE */
00966     { "Ysmall", 0xF779 }, /* LATIN SMALL CAPITAL LETTER Y */
00967     { "Z", 0x005A }, /* LATIN CAPITAL LETTER Z */
00968     { "Zacute", 0x0179 }, /* LATIN CAPITAL LETTER Z WITH ACUTE */
00969     { "Zcaron", 0x017D }, /* LATIN CAPITAL LETTER Z WITH CARON */
00970     { "Zcaronsmall", 0xF6FF }, /* LATIN SMALL CAPITAL LETTER Z WITH CARON */
00971     { "Zdotaccent", 0x017B }, /* LATIN CAPITAL LETTER Z WITH DOT ABOVE */
00972     { "Zeta", 0x0396 }, /* GREEK CAPITAL LETTER ZETA */
00973     { "Zsmall", 0xF77A }, /* LATIN SMALL CAPITAL LETTER Z */
00974     { "a", 0x0061 }, /* LATIN SMALL LETTER A */
00975     { "aacute", 0x00E1 }, /* LATIN SMALL LETTER A WITH ACUTE */
00976     { "abreve", 0x0103 }, /* LATIN SMALL LETTER A WITH BREVE */
00977     { "acircumflex", 0x00E2 }, /* LATIN SMALL LETTER A WITH CIRCUMFLEX */
00978     { "acute", 0x00B4 }, /* ACUTE ACCENT */
00979     { "acutecomb", 0x0301 }, /* COMBINING ACUTE ACCENT */
00980     { "adieresis", 0x00E4 }, /* LATIN SMALL LETTER A WITH DIAERESIS */
00981     { "ae", 0x00E6 }, /* LATIN SMALL LETTER AE */
00982     { "aeacute", 0x01FD }, /* LATIN SMALL LETTER AE WITH ACUTE */
00983     { "afii00208", 0x2015 }, /* HORIZONTAL BAR */
00984     { "afii10017", 0x0410 }, /* CYRILLIC CAPITAL LETTER A */
00985     { "afii10018", 0x0411 }, /* CYRILLIC CAPITAL LETTER BE */
00986     { "afii10019", 0x0412 }, /* CYRILLIC CAPITAL LETTER VE */
00987     { "afii10020", 0x0413 }, /* CYRILLIC CAPITAL LETTER GHE */
00988     { "afii10021", 0x0414 }, /* CYRILLIC CAPITAL LETTER DE */
00989     { "afii10022", 0x0415 }, /* CYRILLIC CAPITAL LETTER IE */
00990     { "afii10023", 0x0401 }, /* CYRILLIC CAPITAL LETTER IO */
00991     { "afii10024", 0x0416 }, /* CYRILLIC CAPITAL LETTER ZHE */
00992     { "afii10025", 0x0417 }, /* CYRILLIC CAPITAL LETTER ZE */
00993     { "afii10026", 0x0418 }, /* CYRILLIC CAPITAL LETTER I */
00994     { "afii10027", 0x0419 }, /* CYRILLIC CAPITAL LETTER SHORT I */
00995     { "afii10028", 0x041A }, /* CYRILLIC CAPITAL LETTER KA */
00996     { "afii10029", 0x041B }, /* CYRILLIC CAPITAL LETTER EL */
00997     { "afii10030", 0x041C }, /* CYRILLIC CAPITAL LETTER EM */
00998     { "afii10031", 0x041D }, /* CYRILLIC CAPITAL LETTER EN */
00999     { "afii10032", 0x041E }, /* CYRILLIC CAPITAL LETTER O */
01000     { "afii10033", 0x041F }, /* CYRILLIC CAPITAL LETTER PE */
01001     { "afii10034", 0x0420 }, /* CYRILLIC CAPITAL LETTER ER */
01002     { "afii10035", 0x0421 }, /* CYRILLIC CAPITAL LETTER ES */
01003     { "afii10036", 0x0422 }, /* CYRILLIC CAPITAL LETTER TE */
01004     { "afii10037", 0x0423 }, /* CYRILLIC CAPITAL LETTER U */
01005     { "afii10038", 0x0424 }, /* CYRILLIC CAPITAL LETTER EF */
01006     { "afii10039", 0x0425 }, /* CYRILLIC CAPITAL LETTER HA */
01007     { "afii10040", 0x0426 }, /* CYRILLIC CAPITAL LETTER TSE */
01008     { "afii10041", 0x0427 }, /* CYRILLIC CAPITAL LETTER CHE */
01009     { "afii10042", 0x0428 }, /* CYRILLIC CAPITAL LETTER SHA */
01010     { "afii10043", 0x0429 }, /* CYRILLIC CAPITAL LETTER SHCHA */
01011     { "afii10044", 0x042A }, /* CYRILLIC CAPITAL LETTER HARD SIGN */
01012     { "afii10045", 0x042B }, /* CYRILLIC CAPITAL LETTER YERU */
01013     { "afii10046", 0x042C }, /* CYRILLIC CAPITAL LETTER SOFT SIGN */
01014     { "afii10047", 0x042D }, /* CYRILLIC CAPITAL LETTER E */
01015     { "afii10048", 0x042E }, /* CYRILLIC CAPITAL LETTER YU */
01016     { "afii10049", 0x042F }, /* CYRILLIC CAPITAL LETTER YA */
01017     { "afii10050", 0x0490 }, /* CYRILLIC CAPITAL LETTER GHE WITH UPTURN */
01018     { "afii10051", 0x0402 }, /* CYRILLIC CAPITAL LETTER DJE */
01019     { "afii10052", 0x0403 }, /* CYRILLIC CAPITAL LETTER GJE */
01020     { "afii10053", 0x0404 }, /* CYRILLIC CAPITAL LETTER UKRAINIAN IE */
01021     { "afii10054", 0x0405 }, /* CYRILLIC CAPITAL LETTER DZE */
01022     { "afii10055", 0x0406 }, /* CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I */
01023     { "afii10056", 0x0407 }, /* CYRILLIC CAPITAL LETTER YI */
01024     { "afii10057", 0x0408 }, /* CYRILLIC CAPITAL LETTER JE */
01025     { "afii10058", 0x0409 }, /* CYRILLIC CAPITAL LETTER LJE */
01026     { "afii10059", 0x040A }, /* CYRILLIC CAPITAL LETTER NJE */
01027     { "afii10060", 0x040B }, /* CYRILLIC CAPITAL LETTER TSHE */
01028     { "afii10061", 0x040C }, /* CYRILLIC CAPITAL LETTER KJE */
01029     { "afii10062", 0x040E }, /* CYRILLIC CAPITAL LETTER SHORT U */
01030     { "afii10063", 0xF6C4 }, /* CYRILLIC SMALL LETTER GHE VARIANT */
01031     { "afii10064", 0xF6C5 }, /* CYRILLIC SMALL LETTER BE VARIANT */
01032     { "afii10065", 0x0430 }, /* CYRILLIC SMALL LETTER A */
01033     { "afii10066", 0x0431 }, /* CYRILLIC SMALL LETTER BE */
01034     { "afii10067", 0x0432 }, /* CYRILLIC SMALL LETTER VE */
01035     { "afii10068", 0x0433 }, /* CYRILLIC SMALL LETTER GHE */
01036     { "afii10069", 0x0434 }, /* CYRILLIC SMALL LETTER DE */
01037     { "afii10070", 0x0435 }, /* CYRILLIC SMALL LETTER IE */
01038     { "afii10071", 0x0451 }, /* CYRILLIC SMALL LETTER IO */
01039     { "afii10072", 0x0436 }, /* CYRILLIC SMALL LETTER ZHE */
01040     { "afii10073", 0x0437 }, /* CYRILLIC SMALL LETTER ZE */
01041     { "afii10074", 0x0438 }, /* CYRILLIC SMALL LETTER I */
01042     { "afii10075", 0x0439 }, /* CYRILLIC SMALL LETTER SHORT I */
01043     { "afii10076", 0x043A }, /* CYRILLIC SMALL LETTER KA */
01044     { "afii10077", 0x043B }, /* CYRILLIC SMALL LETTER EL */
01045     { "afii10078", 0x043C }, /* CYRILLIC SMALL LETTER EM */
01046     { "afii10079", 0x043D }, /* CYRILLIC SMALL LETTER EN */
01047     { "afii10080", 0x043E }, /* CYRILLIC SMALL LETTER O */
01048     { "afii10081", 0x043F }, /* CYRILLIC SMALL LETTER PE */
01049     { "afii10082", 0x0440 }, /* CYRILLIC SMALL LETTER ER */
01050     { "afii10083", 0x0441 }, /* CYRILLIC SMALL LETTER ES */
01051     { "afii10084", 0x0442 }, /* CYRILLIC SMALL LETTER TE */
01052     { "afii10085", 0x0443 }, /* CYRILLIC SMALL LETTER U */
01053     { "afii10086", 0x0444 }, /* CYRILLIC SMALL LETTER EF */
01054     { "afii10087", 0x0445 }, /* CYRILLIC SMALL LETTER HA */
01055     { "afii10088", 0x0446 }, /* CYRILLIC SMALL LETTER TSE */
01056     { "afii10089", 0x0447 }, /* CYRILLIC SMALL LETTER CHE */
01057     { "afii10090", 0x0448 }, /* CYRILLIC SMALL LETTER SHA */
01058     { "afii10091", 0x0449 }, /* CYRILLIC SMALL LETTER SHCHA */
01059     { "afii10092", 0x044A }, /* CYRILLIC SMALL LETTER HARD SIGN */
01060     { "afii10093", 0x044B }, /* CYRILLIC SMALL LETTER YERU */
01061     { "afii10094", 0x044C }, /* CYRILLIC SMALL LETTER SOFT SIGN */
01062     { "afii10095", 0x044D }, /* CYRILLIC SMALL LETTER E */
01063     { "afii10096", 0x044E }, /* CYRILLIC SMALL LETTER YU */
01064     { "afii10097", 0x044F }, /* CYRILLIC SMALL LETTER YA */
01065     { "afii10098", 0x0491 }, /* CYRILLIC SMALL LETTER GHE WITH UPTURN */
01066     { "afii10099", 0x0452 }, /* CYRILLIC SMALL LETTER DJE */
01067     { "afii10100", 0x0453 }, /* CYRILLIC SMALL LETTER GJE */
01068     { "afii10101", 0x0454 }, /* CYRILLIC SMALL LETTER UKRAINIAN IE */
01069     { "afii10102", 0x0455 }, /* CYRILLIC SMALL LETTER DZE */
01070     { "afii10103", 0x0456 }, /* CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I */
01071     { "afii10104", 0x0457 }, /* CYRILLIC SMALL LETTER YI */
01072     { "afii10105", 0x0458 }, /* CYRILLIC SMALL LETTER JE */
01073     { "afii10106", 0x0459 }, /* CYRILLIC SMALL LETTER LJE */
01074     { "afii10107", 0x045A }, /* CYRILLIC SMALL LETTER NJE */
01075     { "afii10108", 0x045B }, /* CYRILLIC SMALL LETTER TSHE */
01076     { "afii10109", 0x045C }, /* CYRILLIC SMALL LETTER KJE */
01077     { "afii10110", 0x045E }, /* CYRILLIC SMALL LETTER SHORT U */
01078     { "afii10145", 0x040F }, /* CYRILLIC CAPITAL LETTER DZHE */
01079     { "afii10146", 0x0462 }, /* CYRILLIC CAPITAL LETTER YAT */
01080     { "afii10147", 0x0472 }, /* CYRILLIC CAPITAL LETTER FITA */
01081     { "afii10148", 0x0474 }, /* CYRILLIC CAPITAL LETTER IZHITSA */
01082     { "afii10192", 0xF6C6 }, /* CYRILLIC SMALL LETTER DE VARIANT */
01083     { "afii10193", 0x045F }, /* CYRILLIC SMALL LETTER DZHE */
01084     { "afii10194", 0x0463 }, /* CYRILLIC SMALL LETTER YAT */
01085     { "afii10195", 0x0473 }, /* CYRILLIC SMALL LETTER FITA */
01086     { "afii10196", 0x0475 }, /* CYRILLIC SMALL LETTER IZHITSA */
01087     { "afii10831", 0xF6C7 }, /* CYRILLIC SMALL LETTER PE VARIANT */
01088     { "afii10832", 0xF6C8 }, /* CYRILLIC SMALL LETTER TE VARIANT */
01089     { "afii10846", 0x04D9 }, /* CYRILLIC SMALL LETTER SCHWA */
01090     { "afii299", 0x200E }, /* LEFT-TO-RIGHT MARK */
01091     { "afii300", 0x200F }, /* RIGHT-TO-LEFT MARK */
01092     { "afii301", 0x200D }, /* ZERO WIDTH JOINER */
01093     { "afii57381", 0x066A }, /* ARABIC PERCENT SIGN */
01094     { "afii57388", 0x060C }, /* ARABIC COMMA */
01095     { "afii57392", 0x0660 }, /* ARABIC-INDIC DIGIT ZERO */
01096     { "afii57393", 0x0661 }, /* ARABIC-INDIC DIGIT ONE */
01097     { "afii57394", 0x0662 }, /* ARABIC-INDIC DIGIT TWO */
01098     { "afii57395", 0x0663 }, /* ARABIC-INDIC DIGIT THREE */
01099     { "afii57396", 0x0664 }, /* ARABIC-INDIC DIGIT FOUR */
01100     { "afii57397", 0x0665 }, /* ARABIC-INDIC DIGIT FIVE */
01101     { "afii57398", 0x0666 }, /* ARABIC-INDIC DIGIT SIX */
01102     { "afii57399", 0x0667 }, /* ARABIC-INDIC DIGIT SEVEN */
01103     { "afii57400", 0x0668 }, /* ARABIC-INDIC DIGIT EIGHT */
01104     { "afii57401", 0x0669 }, /* ARABIC-INDIC DIGIT NINE */
01105     { "afii57403", 0x061B }, /* ARABIC SEMICOLON */
01106     { "afii57407", 0x061F }, /* ARABIC QUESTION MARK */
01107     { "afii57409", 0x0621 }, /* ARABIC LETTER HAMZA */
01108     { "afii57410", 0x0622 }, /* ARABIC LETTER ALEF WITH MADDA ABOVE */
01109     { "afii57411", 0x0623 }, /* ARABIC LETTER ALEF WITH HAMZA ABOVE */
01110     { "afii57412", 0x0624 }, /* ARABIC LETTER WAW WITH HAMZA ABOVE */
01111     { "afii57413", 0x0625 }, /* ARABIC LETTER ALEF WITH HAMZA BELOW */
01112     { "afii57414", 0x0626 }, /* ARABIC LETTER YEH WITH HAMZA ABOVE */
01113     { "afii57415", 0x0627 }, /* ARABIC LETTER ALEF */
01114     { "afii57416", 0x0628 }, /* ARABIC LETTER BEH */
01115     { "afii57417", 0x0629 }, /* ARABIC LETTER TEH MARBUTA */
01116     { "afii57418", 0x062A }, /* ARABIC LETTER TEH */
01117     { "afii57419", 0x062B }, /* ARABIC LETTER THEH */
01118     { "afii57420", 0x062C }, /* ARABIC LETTER JEEM */
01119     { "afii57421", 0x062D }, /* ARABIC LETTER HAH */
01120     { "afii57422", 0x062E }, /* ARABIC LETTER KHAH */
01121     { "afii57423", 0x062F }, /* ARABIC LETTER DAL */
01122     { "afii57424", 0x0630 }, /* ARABIC LETTER THAL */
01123     { "afii57425", 0x0631 }, /* ARABIC LETTER REH */
01124     { "afii57426", 0x0632 }, /* ARABIC LETTER ZAIN */
01125     { "afii57427", 0x0633 }, /* ARABIC LETTER SEEN */
01126     { "afii57428", 0x0634 }, /* ARABIC LETTER SHEEN */
01127     { "afii57429", 0x0635 }, /* ARABIC LETTER SAD */
01128     { "afii57430", 0x0636 }, /* ARABIC LETTER DAD */
01129     { "afii57431", 0x0637 }, /* ARABIC LETTER TAH */
01130     { "afii57432", 0x0638 }, /* ARABIC LETTER ZAH */
01131     { "afii57433", 0x0639 }, /* ARABIC LETTER AIN */
01132     { "afii57434", 0x063A }, /* ARABIC LETTER GHAIN */
01133     { "afii57440", 0x0640 }, /* ARABIC TATWEEL */
01134     { "afii57441", 0x0641 }, /* ARABIC LETTER FEH */
01135     { "afii57442", 0x0642 }, /* ARABIC LETTER QAF */
01136     { "afii57443", 0x0643 }, /* ARABIC LETTER KAF */
01137     { "afii57444", 0x0644 }, /* ARABIC LETTER LAM */
01138     { "afii57445", 0x0645 }, /* ARABIC LETTER MEEM */
01139     { "afii57446", 0x0646 }, /* ARABIC LETTER NOON */
01140     { "afii57448", 0x0648 }, /* ARABIC LETTER WAW */
01141     { "afii57449", 0x0649 }, /* ARABIC LETTER ALEF MAKSURA */
01142     { "afii57450", 0x064A }, /* ARABIC LETTER YEH */
01143     { "afii57451", 0x064B }, /* ARABIC FATHATAN */
01144     { "afii57452", 0x064C }, /* ARABIC DAMMATAN */
01145     { "afii57453", 0x064D }, /* ARABIC KASRATAN */
01146     { "afii57454", 0x064E }, /* ARABIC FATHA */
01147     { "afii57455", 0x064F }, /* ARABIC DAMMA */
01148     { "afii57456", 0x0650 }, /* ARABIC KASRA */
01149     { "afii57457", 0x0651 }, /* ARABIC SHADDA */
01150     { "afii57458", 0x0652 }, /* ARABIC SUKUN */
01151     { "afii57470", 0x0647 }, /* ARABIC LETTER HEH */
01152     { "afii57505", 0x06A4 }, /* ARABIC LETTER VEH */
01153     { "afii57506", 0x067E }, /* ARABIC LETTER PEH */
01154     { "afii57507", 0x0686 }, /* ARABIC LETTER TCHEH */
01155     { "afii57508", 0x0698 }, /* ARABIC LETTER JEH */
01156     { "afii57509", 0x06AF }, /* ARABIC LETTER GAF */
01157     { "afii57511", 0x0679 }, /* ARABIC LETTER TTEH */
01158     { "afii57512", 0x0688 }, /* ARABIC LETTER DDAL */
01159     { "afii57513", 0x0691 }, /* ARABIC LETTER RREH */
01160     { "afii57514", 0x06BA }, /* ARABIC LETTER NOON GHUNNA */
01161     { "afii57519", 0x06D2 }, /* ARABIC LETTER YEH BARREE */
01162     { "afii57534", 0x06D5 }, /* ARABIC LETTER AE */
01163     { "afii57636", 0x20AA }, /* NEW SHEQEL SIGN */
01164     { "afii57645", 0x05BE }, /* HEBREW PUNCTUATION MAQAF */
01165     { "afii57658", 0x05C3 }, /* HEBREW PUNCTUATION SOF PASUQ */
01166     { "afii57664", 0x05D0 }, /* HEBREW LETTER ALEF */
01167     { "afii57665", 0x05D1 }, /* HEBREW LETTER BET */
01168     { "afii57666", 0x05D2 }, /* HEBREW LETTER GIMEL */
01169     { "afii57667", 0x05D3 }, /* HEBREW LETTER DALET */
01170     { "afii57668", 0x05D4 }, /* HEBREW LETTER HE */
01171     { "afii57669", 0x05D5 }, /* HEBREW LETTER VAV */
01172     { "afii57670", 0x05D6 }, /* HEBREW LETTER ZAYIN */
01173     { "afii57671", 0x05D7 }, /* HEBREW LETTER HET */
01174     { "afii57672", 0x05D8 }, /* HEBREW LETTER TET */
01175     { "afii57673", 0x05D9 }, /* HEBREW LETTER YOD */
01176     { "afii57674", 0x05DA }, /* HEBREW LETTER FINAL KAF */
01177     { "afii57675", 0x05DB }, /* HEBREW LETTER KAF */
01178     { "afii57676", 0x05DC }, /* HEBREW LETTER LAMED */
01179     { "afii57677", 0x05DD }, /* HEBREW LETTER FINAL MEM */
01180     { "afii57678", 0x05DE }, /* HEBREW LETTER MEM */
01181     { "afii57679", 0x05DF }, /* HEBREW LETTER FINAL NUN */
01182     { "afii57680", 0x05E0 }, /* HEBREW LETTER NUN */
01183     { "afii57681", 0x05E1 }, /* HEBREW LETTER SAMEKH */
01184     { "afii57682", 0x05E2 }, /* HEBREW LETTER AYIN */
01185     { "afii57683", 0x05E3 }, /* HEBREW LETTER FINAL PE */
01186     { "afii57684", 0x05E4 }, /* HEBREW LETTER PE */
01187     { "afii57685", 0x05E5 }, /* HEBREW LETTER FINAL TSADI */
01188     { "afii57686", 0x05E6 }, /* HEBREW LETTER TSADI */
01189     { "afii57687", 0x05E7 }, /* HEBREW LETTER QOF */
01190     { "afii57688", 0x05E8 }, /* HEBREW LETTER RESH */
01191     { "afii57689", 0x05E9 }, /* HEBREW LETTER SHIN */
01192     { "afii57690", 0x05EA }, /* HEBREW LETTER TAV */
01193     { "afii57694", 0xFB2A }, /* HEBREW LETTER SHIN WITH SHIN DOT */
01194     { "afii57695", 0xFB2B }, /* HEBREW LETTER SHIN WITH SIN DOT */
01195     { "afii57700", 0xFB4B }, /* HEBREW LETTER VAV WITH HOLAM */
01196     { "afii57705", 0xFB1F }, /* HEBREW LIGATURE YIDDISH YOD YOD PATAH */
01197     { "afii57716", 0x05F0 }, /* HEBREW LIGATURE YIDDISH DOUBLE VAV */
01198     { "afii57717", 0x05F1 }, /* HEBREW LIGATURE YIDDISH VAV YOD */
01199     { "afii57718", 0x05F2 }, /* HEBREW LIGATURE YIDDISH DOUBLE YOD */
01200     { "afii57723", 0xFB35 }, /* HEBREW LETTER VAV WITH DAGESH */
01201     { "afii57793", 0x05B4 }, /* HEBREW POINT HIRIQ */
01202     { "afii57794", 0x05B5 }, /* HEBREW POINT TSERE */
01203     { "afii57795", 0x05B6 }, /* HEBREW POINT SEGOL */
01204     { "afii57796", 0x05BB }, /* HEBREW POINT QUBUTS */
01205     { "afii57797", 0x05B8 }, /* HEBREW POINT QAMATS */
01206     { "afii57798", 0x05B7 }, /* HEBREW POINT PATAH */
01207     { "afii57799", 0x05B0 }, /* HEBREW POINT SHEVA */
01208     { "afii57800", 0x05B2 }, /* HEBREW POINT HATAF PATAH */
01209     { "afii57801", 0x05B1 }, /* HEBREW POINT HATAF SEGOL */
01210     { "afii57802", 0x05B3 }, /* HEBREW POINT HATAF QAMATS */
01211     { "afii57803", 0x05C2 }, /* HEBREW POINT SIN DOT */
01212     { "afii57804", 0x05C1 }, /* HEBREW POINT SHIN DOT */
01213     { "afii57806", 0x05B9 }, /* HEBREW POINT HOLAM */
01214     { "afii57807", 0x05BC }, /* HEBREW POINT DAGESH OR MAPIQ */
01215     { "afii57839", 0x05BD }, /* HEBREW POINT METEG */
01216     { "afii57841", 0x05BF }, /* HEBREW POINT RAFE */
01217     { "afii57842", 0x05C0 }, /* HEBREW PUNCTUATION PASEQ */
01218     { "afii57929", 0x02BC }, /* MODIFIER LETTER APOSTROPHE */
01219     { "afii61248", 0x2105 }, /* CARE OF */
01220     { "afii61289", 0x2113 }, /* SCRIPT SMALL L */
01221     { "afii61352", 0x2116 }, /* NUMERO SIGN */
01222     { "afii61573", 0x202C }, /* POP DIRECTIONAL FORMATTING */
01223     { "afii61574", 0x202D }, /* LEFT-TO-RIGHT OVERRIDE */
01224     { "afii61575", 0x202E }, /* RIGHT-TO-LEFT OVERRIDE */
01225     { "afii61664", 0x200C }, /* ZERO WIDTH NON-JOINER */
01226     { "afii63167", 0x066D }, /* ARABIC FIVE POINTED STAR */
01227     { "afii64937", 0x02BD }, /* MODIFIER LETTER REVERSED COMMA */
01228     { "agrave", 0x00E0 }, /* LATIN SMALL LETTER A WITH GRAVE */
01229     { "aleph", 0x2135 }, /* ALEF SYMBOL */
01230     { "alpha", 0x03B1 }, /* GREEK SMALL LETTER ALPHA */
01231     { "alphatonos", 0x03AC }, /* GREEK SMALL LETTER ALPHA WITH TONOS */
01232     { "amacron", 0x0101 }, /* LATIN SMALL LETTER A WITH MACRON */
01233     { "ampersand", 0x0026 }, /* AMPERSAND */
01234     { "ampersandsmall", 0xF726 }, /* SMALL CAPITAL AMPERSAND */
01235     { "angle", 0x2220 }, /* ANGLE */
01236     { "angleleft", 0x2329 }, /* LEFT-POINTING ANGLE BRACKET */
01237     { "angleright", 0x232A }, /* RIGHT-POINTING ANGLE BRACKET */
01238     { "anoteleia", 0x0387 }, /* GREEK ANO TELEIA */
01239     { "aogonek", 0x0105 }, /* LATIN SMALL LETTER A WITH OGONEK */
01240     { "approxequal", 0x2248 }, /* ALMOST EQUAL TO */
01241     { "aring", 0x00E5 }, /* LATIN SMALL LETTER A WITH RING ABOVE */
01242     { "aringacute", 0x01FB }, /* LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE */
01243     { "arrowboth", 0x2194 }, /* LEFT RIGHT ARROW */
01244     { "arrowdblboth", 0x21D4 }, /* LEFT RIGHT DOUBLE ARROW */
01245     { "arrowdbldown", 0x21D3 }, /* DOWNWARDS DOUBLE ARROW */
01246     { "arrowdblleft", 0x21D0 }, /* LEFTWARDS DOUBLE ARROW */
01247     { "arrowdblright", 0x21D2 }, /* RIGHTWARDS DOUBLE ARROW */
01248     { "arrowdblup", 0x21D1 }, /* UPWARDS DOUBLE ARROW */
01249     { "arrowdown", 0x2193 }, /* DOWNWARDS ARROW */
01250     { "arrowhorizex", 0xF8E7 }, /* HORIZONTAL ARROW EXTENDER */
01251     { "arrowleft", 0x2190 }, /* LEFTWARDS ARROW */
01252     { "arrowright", 0x2192 }, /* RIGHTWARDS ARROW */
01253     { "arrowup", 0x2191 }, /* UPWARDS ARROW */
01254     { "arrowupdn", 0x2195 }, /* UP DOWN ARROW */
01255     { "arrowupdnbse", 0x21A8 }, /* UP DOWN ARROW WITH BASE */
01256     { "arrowvertex", 0xF8E6 }, /* VERTICAL ARROW EXTENDER */
01257     { "asciicircum", 0x005E }, /* CIRCUMFLEX ACCENT */
01258     { "asciitilde", 0x007E }, /* TILDE */
01259     { "asterisk", 0x002A }, /* ASTERISK */
01260     { "asteriskmath", 0x2217 }, /* ASTERISK OPERATOR */
01261     { "asuperior", 0xF6E9 }, /* SUPERSCRIPT LATIN SMALL LETTER A */
01262     { "at", 0x0040 }, /* COMMERCIAL AT */
01263     { "atilde", 0x00E3 }, /* LATIN SMALL LETTER A WITH TILDE */
01264     { "b", 0x0062 }, /* LATIN SMALL LETTER B */
01265     { "backslash", 0x005C }, /* REVERSE SOLIDUS */
01266     { "bar", 0x007C }, /* VERTICAL LINE */
01267     { "beta", 0x03B2 }, /* GREEK SMALL LETTER BETA */
01268     { "block", 0x2588 }, /* FULL BLOCK */
01269     { "braceex", 0xF8F4 }, /* CURLY BRACKET EXTENDER */
01270     { "braceleft", 0x007B }, /* LEFT CURLY BRACKET */
01271     { "braceleftbt", 0xF8F3 }, /* LEFT CURLY BRACKET BOTTOM */
01272     { "braceleftmid", 0xF8F2 }, /* LEFT CURLY BRACKET MID */
01273     { "bracelefttp", 0xF8F1 }, /* LEFT CURLY BRACKET TOP */
01274     { "braceright", 0x007D }, /* RIGHT CURLY BRACKET */
01275     { "bracerightbt", 0xF8FE }, /* RIGHT CURLY BRACKET BOTTOM */
01276     { "bracerightmid", 0xF8FD }, /* RIGHT CURLY BRACKET MID */
01277     { "bracerighttp", 0xF8FC }, /* RIGHT CURLY BRACKET TOP */
01278     { "bracketleft", 0x005B }, /* LEFT SQUARE BRACKET */
01279     { "bracketleftbt", 0xF8F0 }, /* LEFT SQUARE BRACKET BOTTOM */
01280     { "bracketleftex", 0xF8EF }, /* LEFT SQUARE BRACKET EXTENDER */
01281     { "bracketlefttp", 0xF8EE }, /* LEFT SQUARE BRACKET TOP */
01282     { "bracketright", 0x005D }, /* RIGHT SQUARE BRACKET */
01283     { "bracketrightbt", 0xF8FB }, /* RIGHT SQUARE BRACKET BOTTOM */
01284     { "bracketrightex", 0xF8FA }, /* RIGHT SQUARE BRACKET EXTENDER */
01285     { "bracketrighttp", 0xF8F9 }, /* RIGHT SQUARE BRACKET TOP */
01286     { "breve", 0x02D8 }, /* BREVE */
01287     { "brokenbar", 0x00A6 }, /* BROKEN BAR */
01288     { "bsuperior", 0xF6EA }, /* SUPERSCRIPT LATIN SMALL LETTER B */
01289     { "bullet", 0x2022 }, /* BULLET */
01290     { "c", 0x0063 }, /* LATIN SMALL LETTER C */
01291     { "cacute", 0x0107 }, /* LATIN SMALL LETTER C WITH ACUTE */
01292     { "caron", 0x02C7 }, /* CARON */
01293     { "carriagereturn", 0x21B5 }, /* DOWNWARDS ARROW WITH CORNER LEFTWARDS */
01294     { "ccaron", 0x010D }, /* LATIN SMALL LETTER C WITH CARON */
01295     { "ccedilla", 0x00E7 }, /* LATIN SMALL LETTER C WITH CEDILLA */
01296     { "ccircumflex", 0x0109 }, /* LATIN SMALL LETTER C WITH CIRCUMFLEX */
01297     { "cdotaccent", 0x010B }, /* LATIN SMALL LETTER C WITH DOT ABOVE */
01298     { "cedilla", 0x00B8 }, /* CEDILLA */
01299     { "cent", 0x00A2 }, /* CENT SIGN */
01300     { "centinferior", 0xF6DF }, /* SUBSCRIPT CENT SIGN */
01301     { "centoldstyle", 0xF7A2 }, /* OLDSTYLE CENT SIGN */
01302     { "centsuperior", 0xF6E0 }, /* SUPERSCRIPT CENT SIGN */
01303     { "chi", 0x03C7 }, /* GREEK SMALL LETTER CHI */
01304     { "circle", 0x25CB }, /* WHITE CIRCLE */
01305     { "circlemultiply", 0x2297 }, /* CIRCLED TIMES */
01306     { "circleplus", 0x2295 }, /* CIRCLED PLUS */
01307 /*     { "circumflex", 0x02C6 }, /\* MODIFIER LETTER CIRCUMFLEX ACCENT *\/ */
01308     { "circumflex", 0x005E }, /* MODIFIER LETTER CIRCUMFLEX ACCENT */
01309     { "club", 0x2663 }, /* BLACK CLUB SUIT */
01310     { "colon", 0x003A }, /* COLON */
01311     { "colonmonetary", 0x20A1 }, /* COLON SIGN */
01312     { "comma", 0x002C }, /* COMMA */
01313     { "commaaccent", 0xF6C3 }, /* COMMA BELOW */
01314     { "commainferior", 0xF6E1 }, /* SUBSCRIPT COMMA */
01315     { "commasuperior", 0xF6E2 }, /* SUPERSCRIPT COMMA */
01316     { "congruent", 0x2245 }, /* APPROXIMATELY EQUAL TO */
01317     { "copyright", 0x00A9 }, /* COPYRIGHT SIGN */
01318     { "copyrightsans", 0xF8E9 }, /* COPYRIGHT SIGN SANS SERIF */
01319     { "copyrightserif", 0xF6D9 }, /* COPYRIGHT SIGN SERIF */
01320     { "currency", 0x00A4 }, /* CURRENCY SIGN */
01321     { "cyrBreve", 0xF6D1 }, /* CAPITAL CYRILLIC BREVE */
01322     { "cyrFlex", 0xF6D2 }, /* CAPITAL CYRILLIC CIRCUMFLEX */
01323     { "cyrbreve", 0xF6D4 }, /* CYRILLIC BREVE */
01324     { "cyrflex", 0xF6D5 }, /* CYRILLIC CIRCUMFLEX */
01325     { "d", 0x0064 }, /* LATIN SMALL LETTER D */
01326     { "dagger", 0x2020 }, /* DAGGER */
01327     { "daggerdbl", 0x2021 }, /* DOUBLE DAGGER */
01328     { "dblGrave", 0xF6D3 }, /* CAPITAL DOUBLE GRAVE ACCENT */
01329     { "dblgrave", 0xF6D6 }, /* DOUBLE GRAVE ACCENT */
01330     { "dcaron", 0x010F }, /* LATIN SMALL LETTER D WITH CARON */
01331     { "dcroat", 0x0111 }, /* LATIN SMALL LETTER D WITH STROKE */
01332     { "degree", 0x00B0 }, /* DEGREE SIGN */
01333     { "delta", 0x03B4 }, /* GREEK SMALL LETTER DELTA */
01334     { "diamond", 0x2666 }, /* BLACK DIAMOND SUIT */
01335     { "dieresis", 0x00A8 }, /* DIAERESIS */
01336     { "dieresisacute", 0xF6D7 }, /* DIAERESIS ACUTE ACCENT */
01337     { "dieresisgrave", 0xF6D8 }, /* DIAERESIS GRAVE ACCENT */
01338     { "dieresistonos", 0x0385 }, /* GREEK DIALYTIKA TONOS */
01339     { "divide", 0x00F7 }, /* DIVISION SIGN */
01340     { "dkshade", 0x2593 }, /* DARK SHADE */
01341     { "dnblock", 0x2584 }, /* LOWER HALF BLOCK */
01342     { "dollar", 0x0024 }, /* DOLLAR SIGN */
01343     { "dollarinferior", 0xF6E3 }, /* SUBSCRIPT DOLLAR SIGN */
01344     { "dollaroldstyle", 0xF724 }, /* OLDSTYLE DOLLAR SIGN */
01345     { "dollarsuperior", 0xF6E4 }, /* SUPERSCRIPT DOLLAR SIGN */
01346     { "dong", 0x20AB }, /* DONG SIGN */
01347     { "dotaccent", 0x02D9 }, /* DOT ABOVE */
01348     { "dotbelowcomb", 0x0323 }, /* COMBINING DOT BELOW */
01349     { "dotlessi", 0x0131 }, /* LATIN SMALL LETTER DOTLESS I */
01350     { "dotlessj", 0xF6BE }, /* LATIN SMALL LETTER DOTLESS J */
01351     { "dotmath", 0x22C5 }, /* DOT OPERATOR */
01352     { "dsuperior", 0xF6EB }, /* SUPERSCRIPT LATIN SMALL LETTER D */
01353     { "e", 0x0065 }, /* LATIN SMALL LETTER E */
01354     { "eacute", 0x00E9 }, /* LATIN SMALL LETTER E WITH ACUTE */
01355     { "ebreve", 0x0115 }, /* LATIN SMALL LETTER E WITH BREVE */
01356     { "ecaron", 0x011B }, /* LATIN SMALL LETTER E WITH CARON */
01357     { "ecircumflex", 0x00EA }, /* LATIN SMALL LETTER E WITH CIRCUMFLEX */
01358     { "edieresis", 0x00EB }, /* LATIN SMALL LETTER E WITH DIAERESIS */
01359     { "edotaccent", 0x0117 }, /* LATIN SMALL LETTER E WITH DOT ABOVE */
01360     { "egrave", 0x00E8 }, /* LATIN SMALL LETTER E WITH GRAVE */
01361     { "eight", 0x0038 }, /* DIGIT EIGHT */
01362     { "eightinferior", 0x2088 }, /* SUBSCRIPT EIGHT */
01363     { "eightoldstyle", 0xF738 }, /* OLDSTYLE DIGIT EIGHT */
01364     { "eightsuperior", 0x2078 }, /* SUPERSCRIPT EIGHT */
01365     { "element", 0x2208 }, /* ELEMENT OF */
01366     { "ellipsis", 0x2026 }, /* HORIZONTAL ELLIPSIS */
01367     { "emacron", 0x0113 }, /* LATIN SMALL LETTER E WITH MACRON */
01368     { "emdash", 0x2014 }, /* EM DASH */
01369     { "emptyset", 0x2205 }, /* EMPTY SET */
01370     { "endash", 0x2013 }, /* EN DASH */
01371     { "eng", 0x014B }, /* LATIN SMALL LETTER ENG */
01372     { "eogonek", 0x0119 }, /* LATIN SMALL LETTER E WITH OGONEK */
01373     { "epsilon", 0x03B5 }, /* GREEK SMALL LETTER EPSILON */
01374     { "epsilontonos", 0x03AD }, /* GREEK SMALL LETTER EPSILON WITH TONOS */
01375     { "equal", 0x003D }, /* EQUALS SIGN */
01376     { "equivalence", 0x2261 }, /* IDENTICAL TO */
01377     { "estimated", 0x212E }, /* ESTIMATED SYMBOL */
01378     { "esuperior", 0xF6EC }, /* SUPERSCRIPT LATIN SMALL LETTER E */
01379     { "eta", 0x03B7 }, /* GREEK SMALL LETTER ETA */
01380     { "etatonos", 0x03AE }, /* GREEK SMALL LETTER ETA WITH TONOS */
01381     { "eth", 0x00F0 }, /* LATIN SMALL LETTER ETH */
01382     { "exclam", 0x0021 }, /* EXCLAMATION MARK */
01383     { "exclamdbl", 0x203C }, /* DOUBLE EXCLAMATION MARK */
01384     { "exclamdown", 0x00A1 }, /* INVERTED EXCLAMATION MARK */
01385     { "exclamdownsmall", 0xF7A1 }, /* SMALL CAPITAL INVERTED EXCLAMATION MARK */
01386     { "exclamsmall", 0xF721 }, /* SMALL CAPITAL EXCLAMATION MARK */
01387     { "existential", 0x2203 }, /* THERE EXISTS */
01388     { "f", 0x0066 }, /* LATIN SMALL LETTER F */
01389     { "female", 0x2640 }, /* FEMALE SIGN */
01390     { "ff", 0xFB00 }, /* LATIN SMALL LIGATURE FF */
01391     { "ffi", 0xFB03 }, /* LATIN SMALL LIGATURE FFI */
01392     { "ffl", 0xFB04 }, /* LATIN SMALL LIGATURE FFL */
01393     { "fi", 0xFB01 }, /* LATIN SMALL LIGATURE FI */
01394     { "figuredash", 0x2012 }, /* FIGURE DASH */
01395     { "filledbox", 0x25A0 }, /* BLACK SQUARE */
01396     { "filledrect", 0x25AC }, /* BLACK RECTANGLE */
01397     { "five", 0x0035 }, /* DIGIT FIVE */
01398     { "fiveeighths", 0x215D }, /* VULGAR FRACTION FIVE EIGHTHS */
01399     { "fiveinferior", 0x2085 }, /* SUBSCRIPT FIVE */
01400     { "fiveoldstyle", 0xF735 }, /* OLDSTYLE DIGIT FIVE */
01401     { "fivesuperior", 0x2075 }, /* SUPERSCRIPT FIVE */
01402     { "fl", 0xFB02 }, /* LATIN SMALL LIGATURE FL */
01403     { "florin", 0x0192 }, /* LATIN SMALL LETTER F WITH HOOK */
01404     { "four", 0x0034 }, /* DIGIT FOUR */
01405     { "fourinferior", 0x2084 }, /* SUBSCRIPT FOUR */
01406     { "fouroldstyle", 0xF734 }, /* OLDSTYLE DIGIT FOUR */
01407     { "foursuperior", 0x2074 }, /* SUPERSCRIPT FOUR */
01408     { "fraction", 0x2044 }, /* FRACTION SLASH */
01409 #if 0
01410     { "fraction" DUP2, 0x2215 }, /* DIVISION SLASH;Duplicate */
01411 #endif /* 0 */
01412     { "franc", 0x20A3 }, /* FRENCH FRANC SIGN */
01413     { "ft", 0xFB05 }, /* LATIN SMALL LIGATURE FT */
01414     { "g", 0x0067 }, /* LATIN SMALL LETTER G */
01415     { "gamma", 0x03B3 }, /* GREEK SMALL LETTER GAMMA */
01416     { "gbreve", 0x011F }, /* LATIN SMALL LETTER G WITH BREVE */
01417     { "gcaron", 0x01E7 }, /* LATIN SMALL LETTER G WITH CARON */
01418     { "gcircumflex", 0x011D }, /* LATIN SMALL LETTER G WITH CIRCUMFLEX */
01419     { "gcommaaccent", 0x0123 }, /* LATIN SMALL LETTER G WITH CEDILLA */
01420     { "gdotaccent", 0x0121 }, /* LATIN SMALL LETTER G WITH DOT ABOVE */
01421     { "germandbls", 0x00DF }, /* LATIN SMALL LETTER SHARP S */
01422     { "gradient", 0x2207 }, /* NABLA */
01423     { "grave", 0x0060 }, /* GRAVE ACCENT */
01424     { "gravecomb", 0x0300 }, /* COMBINING GRAVE ACCENT */
01425     { "greater", 0x003E }, /* GREATER-THAN SIGN */
01426     { "greaterequal", 0x2265 }, /* GREATER-THAN OR EQUAL TO */
01427     { "guillemotleft", 0x00AB }, /* LEFT-POINTING DOUBLE ANGLE QUOTATION MARK */
01428     { "guillemotright", 0x00BB }, /* RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK */
01429     { "guilsinglleft", 0x2039 }, /* SINGLE LEFT-POINTING ANGLE QUOTATION MARK */
01430     { "guilsinglright", 0x203A }, /* SINGLE RIGHT-POINTING ANGLE QUOTATION MARK */
01431     { "h", 0x0068 }, /* LATIN SMALL LETTER H */
01432     { "hbar", 0x0127 }, /* LATIN SMALL LETTER H WITH STROKE */
01433     { "hcircumflex", 0x0125 }, /* LATIN SMALL LETTER H WITH CIRCUMFLEX */
01434     { "heart", 0x2665 }, /* BLACK HEART SUIT */
01435     { "hookabovecomb", 0x0309 }, /* COMBINING HOOK ABOVE */
01436     { "house", 0x2302 }, /* HOUSE */
01437     { "hungarumlaut", 0x02DD }, /* DOUBLE ACUTE ACCENT */
01438     { "hyphen", 0x002D }, /* HYPHEN-MINUS */
01439 #if 0
01440     { "hyphen" DUP2, 0x00AD }, /* SOFT HYPHEN;Duplicate */
01441 #endif /* 0 */
01442     { "hypheninferior", 0xF6E5 }, /* SUBSCRIPT HYPHEN-MINUS */
01443     { "hyphensuperior", 0xF6E6 }, /* SUPERSCRIPT HYPHEN-MINUS */
01444     { "i", 0x0069 }, /* LATIN SMALL LETTER I */
01445     { "iacute", 0x00ED }, /* LATIN SMALL LETTER I WITH ACUTE */
01446     { "ibreve", 0x012D }, /* LATIN SMALL LETTER I WITH BREVE */
01447     { "icircumflex", 0x00EE }, /* LATIN SMALL LETTER I WITH CIRCUMFLEX */
01448     { "idieresis", 0x00EF }, /* LATIN SMALL LETTER I WITH DIAERESIS */
01449     { "igrave", 0x00EC }, /* LATIN SMALL LETTER I WITH GRAVE */
01450     { "ij", 0x0133 }, /* LATIN SMALL LIGATURE IJ */
01451     { "imacron", 0x012B }, /* LATIN SMALL LETTER I WITH MACRON */
01452     { "infinity", 0x221E }, /* INFINITY */
01453     { "integral", 0x222B }, /* INTEGRAL */
01454     { "integralbt", 0x2321 }, /* BOTTOM HALF INTEGRAL */
01455     { "integralex", 0xF8F5 }, /* INTEGRAL EXTENDER */
01456     { "integraltp", 0x2320 }, /* TOP HALF INTEGRAL */
01457     { "intersection", 0x2229 }, /* INTERSECTION */
01458     { "invbullet", 0x25D8 }, /* INVERSE BULLET */
01459     { "invcircle", 0x25D9 }, /* INVERSE WHITE CIRCLE */
01460     { "invsmileface", 0x263B }, /* BLACK SMILING FACE */
01461     { "iogonek", 0x012F }, /* LATIN SMALL LETTER I WITH OGONEK */
01462     { "iota", 0x03B9 }, /* GREEK SMALL LETTER IOTA */
01463     { "iotadieresis", 0x03CA }, /* GREEK SMALL LETTER IOTA WITH DIALYTIKA */
01464     { "iotadieresistonos", 0x0390 }, /* GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS */
01465     { "iotatonos", 0x03AF }, /* GREEK SMALL LETTER IOTA WITH TONOS */
01466     { "isuperior", 0xF6ED }, /* SUPERSCRIPT LATIN SMALL LETTER I */
01467     { "itilde", 0x0129 }, /* LATIN SMALL LETTER I WITH TILDE */
01468     { "j", 0x006A }, /* LATIN SMALL LETTER J */
01469     { "jcircumflex", 0x0135 }, /* LATIN SMALL LETTER J WITH CIRCUMFLEX */
01470     { "k", 0x006B }, /* LATIN SMALL LETTER K */
01471     { "kappa", 0x03BA }, /* GREEK SMALL LETTER KAPPA */
01472     { "kcommaaccent", 0x0137 }, /* LATIN SMALL LETTER K WITH CEDILLA */
01473     { "kgreenlandic", 0x0138 }, /* LATIN SMALL LETTER KRA */
01474     { "l", 0x006C }, /* LATIN SMALL LETTER L */
01475     { "lacute", 0x013A }, /* LATIN SMALL LETTER L WITH ACUTE */
01476     { "lambda", 0x03BB }, /* GREEK SMALL LETTER LAMDA */
01477     { "lcaron", 0x013E }, /* LATIN SMALL LETTER L WITH CARON */
01478     { "lcommaaccent", 0x013C }, /* LATIN SMALL LETTER L WITH CEDILLA */
01479     { "ldot", 0x0140 }, /* LATIN SMALL LETTER L WITH MIDDLE DOT */
01480     { "less", 0x003C }, /* LESS-THAN SIGN */
01481     { "lessequal", 0x2264 }, /* LESS-THAN OR EQUAL TO */
01482     { "lfblock", 0x258C }, /* LEFT HALF BLOCK */
01483     { "lira", 0x20A4 }, /* LIRA SIGN */
01484     { "ll", 0xF6C0 }, /* LATIN SMALL LETTER LL */
01485     { "logicaland", 0x2227 }, /* LOGICAL AND */
01486     { "logicalnot", 0x00AC }, /* NOT SIGN */
01487     { "logicalor", 0x2228 }, /* LOGICAL OR */
01488     { "longs", 0x017F }, /* LATIN SMALL LETTER LONG S */
01489     { "lozenge", 0x25CA }, /* LOZENGE */
01490     { "lslash", 0x0142 }, /* LATIN SMALL LETTER L WITH STROKE */
01491     { "lsuperior", 0xF6EE }, /* SUPERSCRIPT LATIN SMALL LETTER L */
01492     { "ltshade", 0x2591 }, /* LIGHT SHADE */
01493     { "m", 0x006D }, /* LATIN SMALL LETTER M */
01494     { "macron", 0x00AF }, /* MACRON */
01495 #if 0
01496     { "macron" DUP2, 0x02C9 }, /* MODIFIER LETTER MACRON;Duplicate */
01497 #endif /* 0 */
01498     { "male", 0x2642 }, /* MALE SIGN */
01499     { "minus", 0x2212 }, /* MINUS SIGN */
01500     { "minute", 0x2032 }, /* PRIME */
01501     { "msuperior", 0xF6EF }, /* SUPERSCRIPT LATIN SMALL LETTER M */
01502     { "mu", 0x00B5 }, /* MICRO SIGN */
01503 #if 0
01504     { "mu" DUP2, 0x03BC }, /* GREEK SMALL LETTER MU;Duplicate */
01505 #endif /* 0 */
01506     { "multiply", 0x00D7 }, /* MULTIPLICATION SIGN */
01507     { "musicalnote", 0x266A }, /* EIGHTH NOTE */
01508     { "musicalnotedbl", 0x266B }, /* BEAMED EIGHTH NOTES */
01509     { "n", 0x006E }, /* LATIN SMALL LETTER N */
01510     { "nacute", 0x0144 }, /* LATIN SMALL LETTER N WITH ACUTE */
01511     { "napostrophe", 0x0149 }, /* LATIN SMALL LETTER N PRECEDED BY APOSTROPHE */
01512     { "ncaron", 0x0148 }, /* LATIN SMALL LETTER N WITH CARON */
01513     { "ncommaaccent", 0x0146 }, /* LATIN SMALL LETTER N WITH CEDILLA */
01514     { "nine", 0x0039 }, /* DIGIT NINE */
01515     { "nineinferior", 0x2089 }, /* SUBSCRIPT NINE */
01516     { "nineoldstyle", 0xF739 }, /* OLDSTYLE DIGIT NINE */
01517     { "ninesuperior", 0x2079 }, /* SUPERSCRIPT NINE */
01518     { "notelement", 0x2209 }, /* NOT AN ELEMENT OF */
01519     { "notequal", 0x2260 }, /* NOT EQUAL TO */
01520     { "notsubset", 0x2284 }, /* NOT A SUBSET OF */
01521     { "nsuperior", 0x207F }, /* SUPERSCRIPT LATIN SMALL LETTER N */
01522     { "ntilde", 0x00F1 }, /* LATIN SMALL LETTER N WITH TILDE */
01523     { "nu", 0x03BD }, /* GREEK SMALL LETTER NU */
01524     { "numbersign", 0x0023 }, /* NUMBER SIGN */
01525     { "o", 0x006F }, /* LATIN SMALL LETTER O */
01526     { "oacute", 0x00F3 }, /* LATIN SMALL LETTER O WITH ACUTE */
01527     { "obreve", 0x014F }, /* LATIN SMALL LETTER O WITH BREVE */
01528     { "ocircumflex", 0x00F4 }, /* LATIN SMALL LETTER O WITH CIRCUMFLEX */
01529     { "odieresis", 0x00F6 }, /* LATIN SMALL LETTER O WITH DIAERESIS */
01530     { "oe", 0x0153 }, /* LATIN SMALL LIGATURE OE */
01531     { "ogonek", 0x02DB }, /* OGONEK */
01532     { "ograve", 0x00F2 }, /* LATIN SMALL LETTER O WITH GRAVE */
01533     { "ohorn", 0x01A1 }, /* LATIN SMALL LETTER O WITH HORN */
01534     { "ohungarumlaut", 0x0151 }, /* LATIN SMALL LETTER O WITH DOUBLE ACUTE */
01535     { "omacron", 0x014D }, /* LATIN SMALL LETTER O WITH MACRON */
01536     { "omega", 0x03C9 }, /* GREEK SMALL LETTER OMEGA */
01537     { "omega1", 0x03D6 }, /* GREEK PI SYMBOL */
01538     { "omegatonos", 0x03CE }, /* GREEK SMALL LETTER OMEGA WITH TONOS */
01539     { "omicron", 0x03BF }, /* GREEK SMALL LETTER OMICRON */
01540     { "omicrontonos", 0x03CC }, /* GREEK SMALL LETTER OMICRON WITH TONOS */
01541     { "one", 0x0031 }, /* DIGIT ONE */
01542     { "onedotenleader", 0x2024 }, /* ONE DOT LEADER */
01543     { "oneeighth", 0x215B }, /* VULGAR FRACTION ONE EIGHTH */
01544     { "onefitted", 0xF6DC }, /* PROPORTIONAL DIGIT ONE */
01545     { "onehalf", 0x00BD }, /* VULGAR FRACTION ONE HALF */
01546     { "oneinferior", 0x2081 }, /* SUBSCRIPT ONE */
01547     { "oneoldstyle", 0xF731 }, /* OLDSTYLE DIGIT ONE */
01548     { "onequarter", 0x00BC }, /* VULGAR FRACTION ONE QUARTER */
01549     { "onesuperior", 0x00B9 }, /* SUPERSCRIPT ONE */
01550     { "onethird", 0x2153 }, /* VULGAR FRACTION ONE THIRD */
01551     { "openbullet", 0x25E6 }, /* WHITE BULLET */
01552     { "ordfeminine", 0x00AA }, /* FEMININE ORDINAL INDICATOR */
01553     { "ordmasculine", 0x00BA }, /* MASCULINE ORDINAL INDICATOR */
01554     { "orthogonal", 0x221F }, /* RIGHT ANGLE */
01555     { "oslash", 0x00F8 }, /* LATIN SMALL LETTER O WITH STROKE */
01556     { "oslashacute", 0x01FF }, /* LATIN SMALL LETTER O WITH STROKE AND ACUTE */
01557     { "osuperior", 0xF6F0 }, /* SUPERSCRIPT LATIN SMALL LETTER O */
01558     { "otilde", 0x00F5 }, /* LATIN SMALL LETTER O WITH TILDE */
01559     { "p", 0x0070 }, /* LATIN SMALL LETTER P */
01560     { "paragraph", 0x00B6 }, /* PILCROW SIGN */
01561     { "parenleft", 0x0028 }, /* LEFT PARENTHESIS */
01562     { "parenleftbt", 0xF8ED }, /* LEFT PAREN BOTTOM */
01563     { "parenleftex", 0xF8EC }, /* LEFT PAREN EXTENDER */
01564     { "parenleftinferior", 0x208D }, /* SUBSCRIPT LEFT PARENTHESIS */
01565     { "parenleftsuperior", 0x207D }, /* SUPERSCRIPT LEFT PARENTHESIS */
01566     { "parenlefttp", 0xF8EB }, /* LEFT PAREN TOP */
01567     { "parenright", 0x0029 }, /* RIGHT PARENTHESIS */
01568     { "parenrightbt", 0xF8F8 }, /* RIGHT PAREN BOTTOM */
01569     { "parenrightex", 0xF8F7 }, /* RIGHT PAREN EXTENDER */
01570     { "parenrightinferior", 0x208E }, /* SUBSCRIPT RIGHT PARENTHESIS */
01571     { "parenrightsuperior", 0x207E }, /* SUPERSCRIPT RIGHT PARENTHESIS */
01572     { "parenrighttp", 0xF8F6 }, /* RIGHT PAREN TOP */
01573     { "partialdiff", 0x2202 }, /* PARTIAL DIFFERENTIAL */
01574     { "percent", 0x0025 }, /* PERCENT SIGN */
01575     { "period", 0x002E }, /* FULL STOP */
01576     { "periodcentered", 0x00B7 }, /* MIDDLE DOT */
01577 #if 0
01578     { "periodcentered" DUP2, 0x2219 }, /* BULLET OPERATOR;Duplicate */
01579 #endif /* 0 */
01580     { "periodinferior", 0xF6E7 }, /* SUBSCRIPT FULL STOP */
01581     { "periodsuperior", 0xF6E8 }, /* SUPERSCRIPT FULL STOP */
01582     { "perpendicular", 0x22A5 }, /* UP TACK */
01583     { "perthousand", 0x2030 }, /* PER MILLE SIGN */
01584     { "peseta", 0x20A7 }, /* PESETA SIGN */
01585     { "phi", 0x03C6 }, /* GREEK SMALL LETTER PHI */
01586     { "phi1", 0x03D5 }, /* GREEK PHI SYMBOL */
01587     { "pi", 0x03C0 }, /* GREEK SMALL LETTER PI */
01588     { "plus", 0x002B }, /* PLUS SIGN */
01589     { "plusminus", 0x00B1 }, /* PLUS-MINUS SIGN */
01590     { "prescription", 0x211E }, /* PRESCRIPTION TAKE */
01591     { "product", 0x220F }, /* N-ARY PRODUCT */
01592     { "propersubset", 0x2282 }, /* SUBSET OF */
01593     { "propersuperset", 0x2283 }, /* SUPERSET OF */
01594     { "proportional", 0x221D }, /* PROPORTIONAL TO */
01595     { "psi", 0x03C8 }, /* GREEK SMALL LETTER PSI */
01596     { "q", 0x0071 }, /* LATIN SMALL LETTER Q */
01597     { "question", 0x003F }, /* QUESTION MARK */
01598     { "questiondown", 0x00BF }, /* INVERTED QUESTION MARK */
01599     { "questiondownsmall", 0xF7BF }, /* SMALL CAPITAL INVERTED QUESTION MARK */
01600     { "questionsmall", 0xF73F }, /* SMALL CAPITAL QUESTION MARK */
01601     { "quotedbl", 0x0022 }, /* QUOTATION MARK */
01602     { "quotedblbase", 0x201E }, /* DOUBLE LOW-9 QUOTATION MARK */
01603     { "quotedblleft", 0x201C }, /* LEFT DOUBLE QUOTATION MARK */
01604     { "quotedblright", 0x201D }, /* RIGHT DOUBLE QUOTATION MARK */
01605     { "quoteleft", 0x2018 }, /* LEFT SINGLE QUOTATION MARK */
01606     { "quotereversed", 0x201B }, /* SINGLE HIGH-REVERSED-9 QUOTATION MARK */
01607     { "quoteright", 0x2019 }, /* RIGHT SINGLE QUOTATION MARK */
01608     { "quotesinglbase", 0x201A }, /* SINGLE LOW-9 QUOTATION MARK */
01609     { "quotesingle", 0x0027 }, /* APOSTROPHE */
01610     { "r", 0x0072 }, /* LATIN SMALL LETTER R */
01611     { "racute", 0x0155 }, /* LATIN SMALL LETTER R WITH ACUTE */
01612     { "radical", 0x221A }, /* SQUARE ROOT */
01613     { "radicalex", 0xF8E5 }, /* RADICAL EXTENDER */
01614     { "rcaron", 0x0159 }, /* LATIN SMALL LETTER R WITH CARON */
01615     { "rcommaaccent", 0x0157 }, /* LATIN SMALL LETTER R WITH CEDILLA */
01616     { "reflexsubset", 0x2286 }, /* SUBSET OF OR EQUAL TO */
01617     { "reflexsuperset", 0x2287 }, /* SUPERSET OF OR EQUAL TO */
01618     { "registered", 0x00AE }, /* REGISTERED SIGN */
01619     { "registersans", 0xF8E8 }, /* REGISTERED SIGN SANS SERIF */
01620     { "registerserif", 0xF6DA }, /* REGISTERED SIGN SERIF */
01621     { "revlogicalnot", 0x2310 }, /* REVERSED NOT SIGN */
01622     { "rho", 0x03C1 }, /* GREEK SMALL LETTER RHO */
01623     { "ring", 0x02DA }, /* RING ABOVE */
01624     { "rsuperior", 0xF6F1 }, /* SUPERSCRIPT LATIN SMALL LETTER R */
01625     { "rtblock", 0x2590 }, /* RIGHT HALF BLOCK */
01626     { "rupiah", 0xF6DD }, /* RUPIAH SIGN */
01627     { "s", 0x0073 }, /* LATIN SMALL LETTER S */
01628     { "sacute", 0x015B }, /* LATIN SMALL LETTER S WITH ACUTE */
01629     { "scaron", 0x0161 }, /* LATIN SMALL LETTER S WITH CARON */
01630     { "scedilla", 0x015F }, /* LATIN SMALL LETTER S WITH CEDILLA */
01631 #if 0
01632     { "scedilla" DUP2, 0xF6C2 }, /* LATIN SMALL LETTER S WITH CEDILLA;Duplicate */
01633 #endif /* 0 */
01634     { "scircumflex", 0x015D }, /* LATIN SMALL LETTER S WITH CIRCUMFLEX */
01635     { "scommaaccent", 0x0219 }, /* LATIN SMALL LETTER S WITH COMMA BELOW */
01636     { "second", 0x2033 }, /* DOUBLE PRIME */
01637     { "section", 0x00A7 }, /* SECTION SIGN */
01638     { "semicolon", 0x003B }, /* SEMICOLON */
01639     { "seven", 0x0037 }, /* DIGIT SEVEN */
01640     { "seveneighths", 0x215E }, /* VULGAR FRACTION SEVEN EIGHTHS */
01641     { "seveninferior", 0x2087 }, /* SUBSCRIPT SEVEN */
01642     { "sevenoldstyle", 0xF737 }, /* OLDSTYLE DIGIT SEVEN */
01643     { "sevensuperior", 0x2077 }, /* SUPERSCRIPT SEVEN */
01644     { "shade", 0x2592 }, /* MEDIUM SHADE */
01645     { "sigma", 0x03C3 }, /* GREEK SMALL LETTER SIGMA */
01646     { "sigma1", 0x03C2 }, /* GREEK SMALL LETTER FINAL SIGMA */
01647     { "similar", 0x223C }, /* TILDE OPERATOR */
01648     { "six", 0x0036 }, /* DIGIT SIX */
01649     { "sixinferior", 0x2086 }, /* SUBSCRIPT SIX */
01650     { "sixoldstyle", 0xF736 }, /* OLDSTYLE DIGIT SIX */
01651     { "sixsuperior", 0x2076 }, /* SUPERSCRIPT SIX */
01652     { "slash", 0x002F }, /* SOLIDUS */
01653     { "smileface", 0x263A }, /* WHITE SMILING FACE */
01654     { "space", 0x0020 }, /* SPACE */
01655 #if 0
01656     { "space" DUP2, 0x00A0 }, /* NO-BREAK SPACE;Duplicate */
01657 #endif /* 0 */
01658     { "spade", 0x2660 }, /* BLACK SPADE SUIT */
01659     { "ssuperior", 0xF6F2 }, /* SUPERSCRIPT LATIN SMALL LETTER S */
01660     { "st", 0xFB06 }, /* LATIN SMALL LIGATURE ST */
01661     { "sterling", 0x00A3 }, /* POUND SIGN */
01662     { "suchthat", 0x220B }, /* CONTAINS AS MEMBER */
01663     { "summation", 0x2211 }, /* N-ARY SUMMATION */
01664     { "summationtext", 0x2211 }, /* N-ARY SUMMATION - apparently this is the name used in cmex? */
01665     { "sun", 0x263C }, /* WHITE SUN WITH RAYS */
01666     { "t", 0x0074 }, /* LATIN SMALL LETTER T */
01667     { "tau", 0x03C4 }, /* GREEK SMALL LETTER TAU */
01668     { "tbar", 0x0167 }, /* LATIN SMALL LETTER T WITH STROKE */
01669     { "tcaron", 0x0165 }, /* LATIN SMALL LETTER T WITH CARON */
01670     { "tcommaaccent", 0x0163 }, /* LATIN SMALL LETTER T WITH CEDILLA */
01671 #if 0
01672     { "tcommaaccent" DUP2, 0x021B }, /* LATIN SMALL LETTER T WITH COMMA BELOW;Duplicate */
01673 #endif /* 0 */
01674     { "therefore", 0x2234 }, /* THEREFORE */
01675     { "theta", 0x03B8 }, /* GREEK SMALL LETTER THETA */
01676     { "theta1", 0x03D1 }, /* GREEK THETA SYMBOL */
01677     { "thorn", 0x00FE }, /* LATIN SMALL LETTER THORN */
01678     { "three", 0x0033 }, /* DIGIT THREE */
01679     { "threeeighths", 0x215C }, /* VULGAR FRACTION THREE EIGHTHS */
01680     { "threeinferior", 0x2083 }, /* SUBSCRIPT THREE */
01681     { "threeoldstyle", 0xF733 }, /* OLDSTYLE DIGIT THREE */
01682     { "threequarters", 0x00BE }, /* VULGAR FRACTION THREE QUARTERS */
01683     { "threequartersemdash", 0xF6DE }, /* THREE QUARTERS EM DASH */
01684     { "threesuperior", 0x00B3 }, /* SUPERSCRIPT THREE */
01685 /*     { "tilde", 0x02DC }, /\* SMALL TILDE *\/ */
01686     { "tilde", 0x007E }, /* ASCII TILDE */
01687     { "tildecomb", 0x0303 }, /* COMBINING TILDE */
01688     { "tonos", 0x0384 }, /* GREEK TONOS */
01689     { "trademark", 0x2122 }, /* TRADE MARK SIGN */
01690     { "trademarksans", 0xF8EA }, /* TRADE MARK SIGN SANS SERIF */
01691     { "trademarkserif", 0xF6DB }, /* TRADE MARK SIGN SERIF */
01692     { "triagdn", 0x25BC }, /* BLACK DOWN-POINTING TRIANGLE */
01693     { "triaglf", 0x25C4 }, /* BLACK LEFT-POINTING POINTER */
01694     { "triagrt", 0x25BA }, /* BLACK RIGHT-POINTING POINTER */
01695     { "triagup", 0x25B2 }, /* BLACK UP-POINTING TRIANGLE */
01696     { "tsuperior", 0xF6F3 }, /* SUPERSCRIPT LATIN SMALL LETTER T */
01697     { "two", 0x0032 }, /* DIGIT TWO */
01698     { "twodotenleader", 0x2025 }, /* TWO DOT LEADER */
01699     { "twoinferior", 0x2082 }, /* SUBSCRIPT TWO */
01700     { "twooldstyle", 0xF732 }, /* OLDSTYLE DIGIT TWO */
01701     { "twosuperior", 0x00B2 }, /* SUPERSCRIPT TWO */
01702     { "twothirds", 0x2154 }, /* VULGAR FRACTION TWO THIRDS */
01703     { "u", 0x0075 }, /* LATIN SMALL LETTER U */
01704     { "uacute", 0x00FA }, /* LATIN SMALL LETTER U WITH ACUTE */
01705     { "ubreve", 0x016D }, /* LATIN SMALL LETTER U WITH BREVE */
01706     { "ucircumflex", 0x00FB }, /* LATIN SMALL LETTER U WITH CIRCUMFLEX */
01707     { "udieresis", 0x00FC }, /* LATIN SMALL LETTER U WITH DIAERESIS */
01708     { "ugrave", 0x00F9 }, /* LATIN SMALL LETTER U WITH GRAVE */
01709     { "uhorn", 0x01B0 }, /* LATIN SMALL LETTER U WITH HORN */
01710     { "uhungarumlaut", 0x0171 }, /* LATIN SMALL LETTER U WITH DOUBLE ACUTE */
01711     { "umacron", 0x016B }, /* LATIN SMALL LETTER U WITH MACRON */
01712     { "underscore", 0x005F }, /* LOW LINE */
01713     { "underscoredbl", 0x2017 }, /* DOUBLE LOW LINE */
01714     { "union", 0x222A }, /* UNION */
01715     { "universal", 0x2200 }, /* FOR ALL */
01716     { "uogonek", 0x0173 }, /* LATIN SMALL LETTER U WITH OGONEK */
01717     { "upblock", 0x2580 }, /* UPPER HALF BLOCK */
01718     { "upsilon", 0x03C5 }, /* GREEK SMALL LETTER UPSILON */
01719     { "upsilondieresis", 0x03CB }, /* GREEK SMALL LETTER UPSILON WITH DIALYTIKA */
01720     { "upsilondieresistonos", 0x03B0 }, /* GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS */
01721     { "upsilontonos", 0x03CD }, /* GREEK SMALL LETTER UPSILON WITH TONOS */
01722     { "uring", 0x016F }, /* LATIN SMALL LETTER U WITH RING ABOVE */
01723     { "utilde", 0x0169 }, /* LATIN SMALL LETTER U WITH TILDE */
01724     { "v", 0x0076 }, /* LATIN SMALL LETTER V */
01725     { "w", 0x0077 }, /* LATIN SMALL LETTER W */
01726     { "wacute", 0x1E83 }, /* LATIN SMALL LETTER W WITH ACUTE */
01727     { "wcircumflex", 0x0175 }, /* LATIN SMALL LETTER W WITH CIRCUMFLEX */
01728     { "wdieresis", 0x1E85 }, /* LATIN SMALL LETTER W WITH DIAERESIS */
01729     { "weierstrass", 0x2118 }, /* SCRIPT CAPITAL P */
01730     { "wgrave", 0x1E81 }, /* LATIN SMALL LETTER W WITH GRAVE */
01731     { "x", 0x0078 }, /* LATIN SMALL LETTER X */
01732     { "xi", 0x03BE }, /* GREEK SMALL LETTER XI */
01733     { "y", 0x0079 }, /* LATIN SMALL LETTER Y */
01734     { "yacute", 0x00FD }, /* LATIN SMALL LETTER Y WITH ACUTE */
01735     { "ycircumflex", 0x0177 }, /* LATIN SMALL LETTER Y WITH CIRCUMFLEX */
01736     { "ydieresis", 0x00FF }, /* LATIN SMALL LETTER Y WITH DIAERESIS */
01737     { "yen", 0x00A5 }, /* YEN SIGN */
01738     { "ygrave", 0x1EF3 }, /* LATIN SMALL LETTER Y WITH GRAVE */
01739     { "z", 0x007A }, /* LATIN SMALL LETTER Z */
01740     { "zacute", 0x017A }, /* LATIN SMALL LETTER Z WITH ACUTE */
01741     { "zcaron", 0x017E }, /* LATIN SMALL LETTER Z WITH CARON */
01742     { "zdotaccent", 0x017C }, /* LATIN SMALL LETTER Z WITH DOT ABOVE */
01743     { "zero", 0x0030 }, /* DIGIT ZERO */
01744     { "zeroinferior", 0x2080 }, /* SUBSCRIPT ZERO */
01745     { "zerooldstyle", 0xF730 }, /* OLDSTYLE DIGIT ZERO */
01746     { "zerosuperior", 0x2070 }, /* SUPERSCRIPT ZERO */
01747     { "zeta", 0x03B6 } /* GREEK SMALL LETTER ZETA */
01748 };
01749 
01750 #if 0
01751 static struct unicode2adobe unicode2adobe_table[] = {
01752     { 0, ".notdef" }, /* was: QUESTION MARK; changed to 0 */
01753     { 0x0020, "space" }, /* SPACE */
01754     { 0x0021, "exclam" }, /* EXCLAMATION MARK */
01755     { 0x0022, "quotedbl" }, /* QUOTATION MARK */
01756     { 0x0023, "numbersign" }, /* NUMBER SIGN */
01757     { 0x0024, "dollar" }, /* DOLLAR SIGN */
01758     { 0x0025, "percent" }, /* PERCENT SIGN */
01759     { 0x0026, "ampersand" }, /* AMPERSAND */
01760     { 0x0027, "quotesingle" }, /* APOSTROPHE */
01761     { 0x0028, "parenleft" }, /* LEFT PARENTHESIS */
01762     { 0x0029, "parenright" }, /* RIGHT PARENTHESIS */
01763     { 0x002A, "asterisk" }, /* ASTERISK */
01764     { 0x002B, "plus" }, /* PLUS SIGN */
01765     { 0x002C, "comma" }, /* COMMA */
01766     { 0x002D, "hyphen" }, /* HYPHEN-MINUS */
01767     { 0x002D, "$hyphen"  }, /* HYPHEN-MINUS; distinguish Adobe duplicates */
01768     { 0x002E, "period" }, /* FULL STOP */
01769     { 0x002F, "slash" }, /* SOLIDUS */
01770     { 0x0030, "zero" }, /* DIGIT ZERO */
01771     { 0x0031, "one" }, /* DIGIT ONE */
01772     { 0x0032, "two" }, /* DIGIT TWO */
01773     { 0x0033, "three" }, /* DIGIT THREE */
01774     { 0x0034, "four" }, /* DIGIT FOUR */
01775     { 0x0035, "five" }, /* DIGIT FIVE */
01776     { 0x0036, "six" }, /* DIGIT SIX */
01777     { 0x0037, "seven" }, /* DIGIT SEVEN */
01778     { 0x0038, "eight" }, /* DIGIT EIGHT */
01779     { 0x0039, "nine" }, /* DIGIT NINE */
01780     { 0x003A, "colon" }, /* COLON */
01781     { 0x003B, "semicolon" }, /* SEMICOLON */
01782     { 0x003C, "less" }, /* LESS-THAN SIGN */
01783     { 0x003D, "equal" }, /* EQUALS SIGN */
01784     { 0x003E, "greater" }, /* GREATER-THAN SIGN */
01785     { 0x003F, "question" }, /* QUESTION MARK */
01786     { 0x0040, "at" }, /* COMMERCIAL AT */
01787     { 0x0041, "A" }, /* LATIN CAPITAL LETTER A */
01788     { 0x0042, "B" }, /* LATIN CAPITAL LETTER B */
01789     { 0x0043, "C" }, /* LATIN CAPITAL LETTER C */
01790     { 0x0044, "D" }, /* LATIN CAPITAL LETTER D */
01791     { 0x0045, "E" }, /* LATIN CAPITAL LETTER E */
01792     { 0x0046, "F" }, /* LATIN CAPITAL LETTER F */
01793     { 0x0047, "G" }, /* LATIN CAPITAL LETTER G */
01794     { 0x0048, "H" }, /* LATIN CAPITAL LETTER H */
01795     { 0x0049, "I" }, /* LATIN CAPITAL LETTER I */
01796     { 0x004A, "J" }, /* LATIN CAPITAL LETTER J */
01797     { 0x004B, "K" }, /* LATIN CAPITAL LETTER K */
01798     { 0x004C, "L" }, /* LATIN CAPITAL LETTER L */
01799     { 0x004D, "M" }, /* LATIN CAPITAL LETTER M */
01800     { 0x004E, "N" }, /* LATIN CAPITAL LETTER N */
01801     { 0x004F, "O" }, /* LATIN CAPITAL LETTER O */
01802     { 0x0050, "P" }, /* LATIN CAPITAL LETTER P */
01803     { 0x0051, "Q" }, /* LATIN CAPITAL LETTER Q */
01804     { 0x0052, "R" }, /* LATIN CAPITAL LETTER R */
01805     { 0x0053, "S" }, /* LATIN CAPITAL LETTER S */
01806     { 0x0054, "T" }, /* LATIN CAPITAL LETTER T */
01807     { 0x0055, "U" }, /* LATIN CAPITAL LETTER U */
01808     { 0x0056, "V" }, /* LATIN CAPITAL LETTER V */
01809     { 0x0057, "W" }, /* LATIN CAPITAL LETTER W */
01810     { 0x0058, "X" }, /* LATIN CAPITAL LETTER X */
01811     { 0x0059, "Y" }, /* LATIN CAPITAL LETTER Y */
01812     { 0x005A, "Z" }, /* LATIN CAPITAL LETTER Z */
01813     { 0x005B, "bracketleft" }, /* LEFT SQUARE BRACKET */
01814     { 0x005C, "backslash" }, /* REVERSE SOLIDUS */
01815     { 0x005D, "bracketright" }, /* RIGHT SQUARE BRACKET */
01816     { 0x005E, "circumflex" }, /* CIRCUMFLEX ACCENT */   /* SU: renamed from asciicircum */
01817     { 0x005F, "underscore" }, /* LOW LINE */
01818     { 0x0060, "grave" }, /* GRAVE ACCENT */
01819     { 0x0061, "a" }, /* LATIN SMALL LETTER A */
01820     { 0x0062, "b" }, /* LATIN SMALL LETTER B */
01821     { 0x0063, "c" }, /* LATIN SMALL LETTER C */
01822     { 0x0064, "d" }, /* LATIN SMALL LETTER D */
01823     { 0x0065, "e" }, /* LATIN SMALL LETTER E */
01824     { 0x0066, "f" }, /* LATIN SMALL LETTER F */
01825     { 0x0067, "g" }, /* LATIN SMALL LETTER G */
01826     { 0x0068, "h" }, /* LATIN SMALL LETTER H */
01827     { 0x0069, "i" }, /* LATIN SMALL LETTER I */
01828     { 0x006A, "j" }, /* LATIN SMALL LETTER J */
01829     { 0x006B, "k" }, /* LATIN SMALL LETTER K */
01830     { 0x006C, "l" }, /* LATIN SMALL LETTER L */
01831     { 0x006D, "m" }, /* LATIN SMALL LETTER M */
01832     { 0x006E, "n" }, /* LATIN SMALL LETTER N */
01833     { 0x006F, "o" }, /* LATIN SMALL LETTER O */
01834     { 0x0070, "p" }, /* LATIN SMALL LETTER P */
01835     { 0x0071, "q" }, /* LATIN SMALL LETTER Q */
01836     { 0x0072, "r" }, /* LATIN SMALL LETTER R */
01837     { 0x0073, "s" }, /* LATIN SMALL LETTER S */
01838     { 0x0074, "t" }, /* LATIN SMALL LETTER T */
01839     { 0x0075, "u" }, /* LATIN SMALL LETTER U */
01840     { 0x0076, "v" }, /* LATIN SMALL LETTER V */
01841     { 0x0077, "w" }, /* LATIN SMALL LETTER W */
01842     { 0x0078, "x" }, /* LATIN SMALL LETTER X */
01843     { 0x0079, "y" }, /* LATIN SMALL LETTER Y */
01844     { 0x007A, "z" }, /* LATIN SMALL LETTER Z */
01845     { 0x007B, "braceleft" }, /* LEFT CURLY BRACKET */
01846     { 0x007C, "bar" }, /* VERTICAL LINE */
01847     { 0x007D, "braceright" }, /* RIGHT CURLY BRACKET */
01848     { 0x007E, "tilde" }, /* TILDE */                    /* SU: renamed from asciitilde */
01849     { 0x00A0, "$spacenobreak"  }, /* NO-BREAK SPACE; distinguish Adobe duplicates */
01850     { 0x00A1, "exclamdown" }, /* INVERTED EXCLAMATION MARK */
01851     { 0x00A2, "cent" }, /* CENT SIGN */
01852     { 0x00A3, "sterling" }, /* POUND SIGN */
01853     { 0x00A4, "currency" }, /* CURRENCY SIGN */
01854     { 0x00A5, "yen" }, /* YEN SIGN */
01855     { 0x00A6, "brokenbar" }, /* BROKEN BAR */
01856     { 0x00A7, "section" }, /* SECTION SIGN */
01857     { 0x00A8, "dieresis" }, /* DIAERESIS */
01858     { 0x00A9, "copyright" }, /* COPYRIGHT SIGN */
01859     { 0x00AA, "ordfeminine" }, /* FEMININE ORDINAL INDICATOR */
01860     { 0x00AB, "guillemotleft" }, /* LEFT-POINTING DOUBLE ANGLE QUOTATION MARK */
01861     { 0x00AC, "logicalnot" }, /* NOT SIGN */
01862     { 0x00AD, "$hyphensoft"  }, /* SOFT HYPHEN; distinguish Adobe duplicates */
01863     { 0x00AE, "registered" }, /* REGISTERED SIGN */
01864     { 0x00AF, "macron" }, /* MACRON */
01865     { 0x00AF, "$macron" }, /* MACRON; distinguish Adobe duplicates */
01866     { 0x00B0, "degree" }, /* DEGREE SIGN */
01867     { 0x00B1, "plusminus" }, /* PLUS-MINUS SIGN */
01868     { 0x00B2, "twosuperior" }, /* SUPERSCRIPT TWO */
01869     { 0x00B3, "threesuperior" }, /* SUPERSCRIPT THREE */
01870     { 0x00B4, "acute" }, /* ACUTE ACCENT */
01871     { 0x00B5, "$micro" }, /* MICRO SIGN; distinguish Adobe duplicates */
01872     { 0x00B5, "mu" }, /* MICRO SIGN */
01873     { 0x00B6, "paragraph" }, /* PILCROW SIGN */
01874     { 0x00B7, "periodcentered" }, /* MIDDLE DOT */
01875     { 0x00B7, "$periodcentered"  }, /* MIDDLE DOT; distinguish Adobe duplicates */
01876     { 0x00B8, "cedilla" }, /* CEDILLA */
01877     { 0x00B9, "onesuperior" }, /* SUPERSCRIPT ONE */
01878     { 0x00BA, "ordmasculine" }, /* MASCULINE ORDINAL INDICATOR */
01879     { 0x00BB, "guillemotright" }, /* RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK */
01880     { 0x00BC, "onequarter" }, /* VULGAR FRACTION ONE QUARTER */
01881     { 0x00BD, "onehalf" }, /* VULGAR FRACTION ONE HALF */
01882     { 0x00BE, "threequarters" }, /* VULGAR FRACTION THREE QUARTERS */
01883     { 0x00BF, "questiondown" }, /* INVERTED QUESTION MARK */
01884     { 0x00C0, "Agrave" }, /* LATIN CAPITAL LETTER A WITH GRAVE */
01885     { 0x00C1, "Aacute" }, /* LATIN CAPITAL LETTER A WITH ACUTE */
01886     { 0x00C2, "Acircumflex" }, /* LATIN CAPITAL LETTER A WITH CIRCUMFLEX */
01887     { 0x00C3, "Atilde" }, /* LATIN CAPITAL LETTER A WITH TILDE */
01888     { 0x00C4, "Adieresis" }, /* LATIN CAPITAL LETTER A WITH DIAERESIS */
01889     { 0x00C5, "Aring" }, /* LATIN CAPITAL LETTER A WITH RING ABOVE */
01890     { 0x00C6, "AE" }, /* LATIN CAPITAL LETTER AE */
01891     { 0x00C7, "Ccedilla" }, /* LATIN CAPITAL LETTER C WITH CEDILLA */
01892     { 0x00C8, "Egrave" }, /* LATIN CAPITAL LETTER E WITH GRAVE */
01893     { 0x00C9, "Eacute" }, /* LATIN CAPITAL LETTER E WITH ACUTE */
01894     { 0x00CA, "Ecircumflex" }, /* LATIN CAPITAL LETTER E WITH CIRCUMFLEX */
01895     { 0x00CB, "Edieresis" }, /* LATIN CAPITAL LETTER E WITH DIAERESIS */
01896     { 0x00CC, "Igrave" }, /* LATIN CAPITAL LETTER I WITH GRAVE */
01897     { 0x00CD, "Iacute" }, /* LATIN CAPITAL LETTER I WITH ACUTE */
01898     { 0x00CE, "Icircumflex" }, /* LATIN CAPITAL LETTER I WITH CIRCUMFLEX */
01899     { 0x00CF, "Idieresis" }, /* LATIN CAPITAL LETTER I WITH DIAERESIS */
01900     { 0x00D0, "Eth" }, /* LATIN CAPITAL LETTER ETH */
01901     { 0x00D1, "Ntilde" }, /* LATIN CAPITAL LETTER N WITH TILDE */
01902     { 0x00D2, "Ograve" }, /* LATIN CAPITAL LETTER O WITH GRAVE */
01903     { 0x00D3, "Oacute" }, /* LATIN CAPITAL LETTER O WITH ACUTE */
01904     { 0x00D4, "Ocircumflex" }, /* LATIN CAPITAL LETTER O WITH CIRCUMFLEX */
01905     { 0x00D5, "Otilde" }, /* LATIN CAPITAL LETTER O WITH TILDE */
01906     { 0x00D6, "Odieresis" }, /* LATIN CAPITAL LETTER O WITH DIAERESIS */
01907     { 0x00D7, "multiply" }, /* MULTIPLICATION SIGN */
01908     { 0x00D8, "Oslash" }, /* LATIN CAPITAL LETTER O WITH STROKE */
01909     { 0x00D9, "Ugrave" }, /* LATIN CAPITAL LETTER U WITH GRAVE */
01910     { 0x00DA, "Uacute" }, /* LATIN CAPITAL LETTER U WITH ACUTE */
01911     { 0x00DB, "Ucircumflex" }, /* LATIN CAPITAL LETTER U WITH CIRCUMFLEX */
01912     { 0x00DC, "Udieresis" }, /* LATIN CAPITAL LETTER U WITH DIAERESIS */
01913     { 0x00DD, "Yacute" }, /* LATIN CAPITAL LETTER Y WITH ACUTE */
01914     { 0x00DE, "Thorn" }, /* LATIN CAPITAL LETTER THORN */
01915     { 0x00DF, "germandbls" }, /* LATIN SMALL LETTER SHARP S */
01916     { 0x00E0, "agrave" }, /* LATIN SMALL LETTER A WITH GRAVE */
01917     { 0x00E1, "aacute" }, /* LATIN SMALL LETTER A WITH ACUTE */
01918     { 0x00E2, "acircumflex" }, /* LATIN SMALL LETTER A WITH CIRCUMFLEX */
01919     { 0x00E3, "atilde" }, /* LATIN SMALL LETTER A WITH TILDE */
01920     { 0x00E4, "adieresis" }, /* LATIN SMALL LETTER A WITH DIAERESIS */
01921     { 0x00E5, "aring" }, /* LATIN SMALL LETTER A WITH RING ABOVE */
01922     { 0x00E6, "ae" }, /* LATIN SMALL LETTER AE */
01923     { 0x00E7, "ccedilla" }, /* LATIN SMALL LETTER C WITH CEDILLA */
01924     { 0x00E8, "egrave" }, /* LATIN SMALL LETTER E WITH GRAVE */
01925     { 0x00E9, "eacute" }, /* LATIN SMALL LETTER E WITH ACUTE */
01926     { 0x00EA, "ecircumflex" }, /* LATIN SMALL LETTER E WITH CIRCUMFLEX */
01927     { 0x00EB, "edieresis" }, /* LATIN SMALL LETTER E WITH DIAERESIS */
01928     { 0x00EC, "igrave" }, /* LATIN SMALL LETTER I WITH GRAVE */
01929     { 0x00ED, "iacute" }, /* LATIN SMALL LETTER I WITH ACUTE */
01930     { 0x00EE, "icircumflex" }, /* LATIN SMALL LETTER I WITH CIRCUMFLEX */
01931     { 0x00EF, "idieresis" }, /* LATIN SMALL LETTER I WITH DIAERESIS */
01932     { 0x00F0, "eth" }, /* LATIN SMALL LETTER ETH */
01933     { 0x00F1, "ntilde" }, /* LATIN SMALL LETTER N WITH TILDE */
01934     { 0x00F2, "ograve" }, /* LATIN SMALL LETTER O WITH GRAVE */
01935     { 0x00F3, "oacute" }, /* LATIN SMALL LETTER O WITH ACUTE */
01936     { 0x00F4, "ocircumflex" }, /* LATIN SMALL LETTER O WITH CIRCUMFLEX */
01937     { 0x00F5, "otilde" }, /* LATIN SMALL LETTER O WITH TILDE */
01938     { 0x00F6, "odieresis" }, /* LATIN SMALL LETTER O WITH DIAERESIS */
01939     { 0x00F7, "divide" }, /* DIVISION SIGN */
01940     { 0x00F8, "oslash" }, /* LATIN SMALL LETTER O WITH STROKE */
01941     { 0x00F9, "ugrave" }, /* LATIN SMALL LETTER U WITH GRAVE */
01942     { 0x00FA, "uacute" }, /* LATIN SMALL LETTER U WITH ACUTE */
01943     { 0x00FB, "ucircumflex" }, /* LATIN SMALL LETTER U WITH CIRCUMFLEX */
01944     { 0x00FC, "udieresis" }, /* LATIN SMALL LETTER U WITH DIAERESIS */
01945     { 0x00FD, "yacute" }, /* LATIN SMALL LETTER Y WITH ACUTE */
01946     { 0x00FE, "thorn" }, /* LATIN SMALL LETTER THORN */
01947     { 0x00FF, "ydieresis" }, /* LATIN SMALL LETTER Y WITH DIAERESIS */
01948     { 0x0100, "Amacron" }, /* LATIN CAPITAL LETTER A WITH MACRON */
01949     { 0x0101, "amacron" }, /* LATIN SMALL LETTER A WITH MACRON */
01950     { 0x0102, "Abreve" }, /* LATIN CAPITAL LETTER A WITH BREVE */
01951     { 0x0103, "abreve" }, /* LATIN SMALL LETTER A WITH BREVE */
01952     { 0x0104, "Aogonek" }, /* LATIN CAPITAL LETTER A WITH OGONEK */
01953     { 0x0105, "aogonek" }, /* LATIN SMALL LETTER A WITH OGONEK */
01954     { 0x0106, "Cacute" }, /* LATIN CAPITAL LETTER C WITH ACUTE */
01955     { 0x0107, "cacute" }, /* LATIN SMALL LETTER C WITH ACUTE */
01956     { 0x0108, "Ccircumflex" }, /* LATIN CAPITAL LETTER C WITH CIRCUMFLEX */
01957     { 0x0109, "ccircumflex" }, /* LATIN SMALL LETTER C WITH CIRCUMFLEX */
01958     { 0x010A, "Cdotaccent" }, /* LATIN CAPITAL LETTER C WITH DOT ABOVE */
01959     { 0x010B, "cdotaccent" }, /* LATIN SMALL LETTER C WITH DOT ABOVE */
01960     { 0x010C, "Ccaron" }, /* LATIN CAPITAL LETTER C WITH CARON */
01961     { 0x010D, "ccaron" }, /* LATIN SMALL LETTER C WITH CARON */
01962     { 0x010E, "Dcaron" }, /* LATIN CAPITAL LETTER D WITH CARON */
01963     { 0x010F, "dcaron" }, /* LATIN SMALL LETTER D WITH CARON */
01964     { 0x0110, "Dcroat" }, /* LATIN CAPITAL LETTER D WITH STROKE */
01965     { 0x0111, "dcroat" }, /* LATIN SMALL LETTER D WITH STROKE */
01966     { 0x0112, "Emacron" }, /* LATIN CAPITAL LETTER E WITH MACRON */
01967     { 0x0113, "emacron" }, /* LATIN SMALL LETTER E WITH MACRON */
01968     { 0x0114, "Ebreve" }, /* LATIN CAPITAL LETTER E WITH BREVE */
01969     { 0x0115, "ebreve" }, /* LATIN SMALL LETTER E WITH BREVE */
01970     { 0x0116, "Edotaccent" }, /* LATIN CAPITAL LETTER E WITH DOT ABOVE */
01971     { 0x0117, "edotaccent" }, /* LATIN SMALL LETTER E WITH DOT ABOVE */
01972     { 0x0118, "Eogonek" }, /* LATIN CAPITAL LETTER E WITH OGONEK */
01973     { 0x0119, "eogonek" }, /* LATIN SMALL LETTER E WITH OGONEK */
01974     { 0x011A, "Ecaron" }, /* LATIN CAPITAL LETTER E WITH CARON */
01975     { 0x011B, "ecaron" }, /* LATIN SMALL LETTER E WITH CARON */
01976     { 0x011C, "Gcircumflex" }, /* LATIN CAPITAL LETTER G WITH CIRCUMFLEX */
01977     { 0x011D, "gcircumflex" }, /* LATIN SMALL LETTER G WITH CIRCUMFLEX */
01978     { 0x011E, "Gbreve" }, /* LATIN CAPITAL LETTER G WITH BREVE */
01979     { 0x011F, "gbreve" }, /* LATIN SMALL LETTER G WITH BREVE */
01980     { 0x0120, "Gdotaccent" }, /* LATIN CAPITAL LETTER G WITH DOT ABOVE */
01981     { 0x0121, "gdotaccent" }, /* LATIN SMALL LETTER G WITH DOT ABOVE */
01982     { 0x0122, "Gcommaaccent" }, /* LATIN CAPITAL LETTER G WITH CEDILLA */
01983     { 0x0123, "gcommaaccent" }, /* LATIN SMALL LETTER G WITH CEDILLA */
01984     { 0x0124, "Hcircumflex" }, /* LATIN CAPITAL LETTER H WITH CIRCUMFLEX */
01985     { 0x0125, "hcircumflex" }, /* LATIN SMALL LETTER H WITH CIRCUMFLEX */
01986     { 0x0126, "Hbar" }, /* LATIN CAPITAL LETTER H WITH STROKE */
01987     { 0x0127, "hbar" }, /* LATIN SMALL LETTER H WITH STROKE */
01988     { 0x0128, "Itilde" }, /* LATIN CAPITAL LETTER I WITH TILDE */
01989     { 0x0129, "itilde" }, /* LATIN SMALL LETTER I WITH TILDE */
01990     { 0x012A, "Imacron" }, /* LATIN CAPITAL LETTER I WITH MACRON */
01991     { 0x012B, "imacron" }, /* LATIN SMALL LETTER I WITH MACRON */
01992     { 0x012C, "Ibreve" }, /* LATIN CAPITAL LETTER I WITH BREVE */
01993     { 0x012D, "ibreve" }, /* LATIN SMALL LETTER I WITH BREVE */
01994     { 0x012E, "Iogonek" }, /* LATIN CAPITAL LETTER I WITH OGONEK */
01995     { 0x012F, "iogonek" }, /* LATIN SMALL LETTER I WITH OGONEK */
01996     { 0x0130, "Idotaccent" }, /* LATIN CAPITAL LETTER I WITH DOT ABOVE */
01997     { 0x0131, "dotlessi" }, /* LATIN SMALL LETTER DOTLESS I */
01998     { 0x0132, "IJ" }, /* LATIN CAPITAL LIGATURE IJ */
01999     { 0x0133, "ij" }, /* LATIN SMALL LIGATURE IJ */
02000     { 0x0134, "Jcircumflex" }, /* LATIN CAPITAL LETTER J WITH CIRCUMFLEX */
02001     { 0x0135, "jcircumflex" }, /* LATIN SMALL LETTER J WITH CIRCUMFLEX */
02002     { 0x0136, "Kcommaaccent" }, /* LATIN CAPITAL LETTER K WITH CEDILLA */
02003     { 0x0137, "kcommaaccent" }, /* LATIN SMALL LETTER K WITH CEDILLA */
02004     { 0x0138, "kgreenlandic" }, /* LATIN SMALL LETTER KRA */
02005     { 0x0139, "Lacute" }, /* LATIN CAPITAL LETTER L WITH ACUTE */
02006     { 0x013A, "lacute" }, /* LATIN SMALL LETTER L WITH ACUTE */
02007     { 0x013B, "Lcommaaccent" }, /* LATIN CAPITAL LETTER L WITH CEDILLA */
02008     { 0x013C, "lcommaaccent" }, /* LATIN SMALL LETTER L WITH CEDILLA */
02009     { 0x013D, "Lcaron" }, /* LATIN CAPITAL LETTER L WITH CARON */
02010     { 0x013E, "lcaron" }, /* LATIN SMALL LETTER L WITH CARON */
02011     { 0x013F, "Ldot" }, /* LATIN CAPITAL LETTER L WITH MIDDLE DOT */
02012     { 0x0140, "ldot" }, /* LATIN SMALL LETTER L WITH MIDDLE DOT */
02013     { 0x0141, "Lslash" }, /* LATIN CAPITAL LETTER L WITH STROKE */
02014     { 0x0142, "lslash" }, /* LATIN SMALL LETTER L WITH STROKE */
02015     { 0x0143, "Nacute" }, /* LATIN CAPITAL LETTER N WITH ACUTE */
02016     { 0x0144, "nacute" }, /* LATIN SMALL LETTER N WITH ACUTE */
02017     { 0x0145, "Ncommaaccent" }, /* LATIN CAPITAL LETTER N WITH CEDILLA */
02018     { 0x0146, "ncommaaccent" }, /* LATIN SMALL LETTER N WITH CEDILLA */
02019     { 0x0147, "Ncaron" }, /* LATIN CAPITAL LETTER N WITH CARON */
02020     { 0x0148, "ncaron" }, /* LATIN SMALL LETTER N WITH CARON */
02021     { 0x0149, "napostrophe" }, /* LATIN SMALL LETTER N PRECEDED BY APOSTROPHE */
02022     { 0x014A, "Eng" }, /* LATIN CAPITAL LETTER ENG */
02023     { 0x014B, "eng" }, /* LATIN SMALL LETTER ENG */
02024     { 0x014C, "Omacron" }, /* LATIN CAPITAL LETTER O WITH MACRON */
02025     { 0x014D, "omacron" }, /* LATIN SMALL LETTER O WITH MACRON */
02026     { 0x014E, "Obreve" }, /* LATIN CAPITAL LETTER O WITH BREVE */
02027     { 0x014F, "obreve" }, /* LATIN SMALL LETTER O WITH BREVE */
02028     { 0x0150, "Ohungarumlaut" }, /* LATIN CAPITAL LETTER O WITH DOUBLE ACUTE */
02029     { 0x0151, "ohungarumlaut" }, /* LATIN SMALL LETTER O WITH DOUBLE ACUTE */
02030     { 0x0152, "OE" }, /* LATIN CAPITAL LIGATURE OE */
02031     { 0x0153, "oe" }, /* LATIN SMALL LIGATURE OE */
02032     { 0x0154, "Racute" }, /* LATIN CAPITAL LETTER R WITH ACUTE */
02033     { 0x0155, "racute" }, /* LATIN SMALL LETTER R WITH ACUTE */
02034     { 0x0156, "Rcommaaccent" }, /* LATIN CAPITAL LETTER R WITH CEDILLA */
02035     { 0x0157, "rcommaaccent" }, /* LATIN SMALL LETTER R WITH CEDILLA */
02036     { 0x0158, "Rcaron" }, /* LATIN CAPITAL LETTER R WITH CARON */
02037     { 0x0159, "rcaron" }, /* LATIN SMALL LETTER R WITH CARON */
02038     { 0x015A, "Sacute" }, /* LATIN CAPITAL LETTER S WITH ACUTE */
02039     { 0x015B, "sacute" }, /* LATIN SMALL LETTER S WITH ACUTE */
02040     { 0x015C, "Scircumflex" }, /* LATIN CAPITAL LETTER S WITH CIRCUMFLEX */
02041     { 0x015D, "scircumflex" }, /* LATIN SMALL LETTER S WITH CIRCUMFLEX */
02042     { 0x015E, "Scedilla" }, /* LATIN CAPITAL LETTER S WITH CEDILLA */
02043     { 0x015E, "$Scedilla"  }, /* LATIN CAPITAL LETTER S WITH CEDILLA; distinguish Adobe duplicates */
02044     { 0x015F, "scedilla" }, /* LATIN SMALL LETTER S WITH CEDILLA */
02045     { 0x015F, "$scedilla"  }, /* LATIN SMALL LETTER S WITH CEDILLA; distinguish Adobe duplicates */
02046     { 0x0160, "Scaron" }, /* LATIN CAPITAL LETTER S WITH CARON */
02047     { 0x0161, "scaron" }, /* LATIN SMALL LETTER S WITH CARON */
02048     { 0x0162, "$Tcedilla" }, /* LATIN CAPITAL LETTER T WITH CEDILLA; distinguish Adobe duplicates */
02049     { 0x0162, "Tcommaaccent" }, /* LATIN CAPITAL LETTER T WITH CEDILLA */
02050     { 0x0163, "$tcedilla" }, /* LATIN SMALL LETTER T WITH CEDILLA; distinguish Adobe duplicates */
02051     { 0x0163, "tcommaaccent" }, /* LATIN SMALL LETTER T WITH CEDILLA */
02052     { 0x0164, "Tcaron" }, /* LATIN CAPITAL LETTER T WITH CARON */
02053     { 0x0165, "tcaron" }, /* LATIN SMALL LETTER T WITH CARON */
02054     { 0x0166, "Tbar" }, /* LATIN CAPITAL LETTER T WITH STROKE */
02055     { 0x0167, "tbar" }, /* LATIN SMALL LETTER T WITH STROKE */
02056     { 0x0168, "Utilde" }, /* LATIN CAPITAL LETTER U WITH TILDE */
02057     { 0x0169, "utilde" }, /* LATIN SMALL LETTER U WITH TILDE */
02058     { 0x016A, "Umacron" }, /* LATIN CAPITAL LETTER U WITH MACRON */
02059     { 0x016B, "umacron" }, /* LATIN SMALL LETTER U WITH MACRON */
02060     { 0x016C, "Ubreve" }, /* LATIN CAPITAL LETTER U WITH BREVE */
02061     { 0x016D, "ubreve" }, /* LATIN SMALL LETTER U WITH BREVE */
02062     { 0x016E, "Uring" }, /* LATIN CAPITAL LETTER U WITH RING ABOVE */
02063     { 0x016F, "uring" }, /* LATIN SMALL LETTER U WITH RING ABOVE */
02064     { 0x0170, "Uhungarumlaut" }, /* LATIN CAPITAL LETTER U WITH DOUBLE ACUTE */
02065     { 0x0171, "uhungarumlaut" }, /* LATIN SMALL LETTER U WITH DOUBLE ACUTE */
02066     { 0x0172, "Uogonek" }, /* LATIN CAPITAL LETTER U WITH OGONEK */
02067     { 0x0173, "uogonek" }, /* LATIN SMALL LETTER U WITH OGONEK */
02068     { 0x0174, "Wcircumflex" }, /* LATIN CAPITAL LETTER W WITH CIRCUMFLEX */
02069     { 0x0175, "wcircumflex" }, /* LATIN SMALL LETTER W WITH CIRCUMFLEX */
02070     { 0x0176, "Ycircumflex" }, /* LATIN CAPITAL LETTER Y WITH CIRCUMFLEX */
02071     { 0x0177, "ycircumflex" }, /* LATIN SMALL LETTER Y WITH CIRCUMFLEX */
02072     { 0x0178, "Ydieresis" }, /* LATIN CAPITAL LETTER Y WITH DIAERESIS */
02073     { 0x0179, "Zacute" }, /* LATIN CAPITAL LETTER Z WITH ACUTE */
02074     { 0x017A, "zacute" }, /* LATIN SMALL LETTER Z WITH ACUTE */
02075     { 0x017B, "Zdotaccent" }, /* LATIN CAPITAL LETTER Z WITH DOT ABOVE */
02076     { 0x017C, "zdotaccent" }, /* LATIN SMALL LETTER Z WITH DOT ABOVE */
02077     { 0x017D, "Zcaron" }, /* LATIN CAPITAL LETTER Z WITH CARON */
02078     { 0x017E, "zcaron" }, /* LATIN SMALL LETTER Z WITH CARON */
02079     { 0x017F, "longs" }, /* LATIN SMALL LETTER LONG S */
02080     { 0x0192, "florin" }, /* LATIN SMALL LETTER F WITH HOOK */
02081     { 0x01A0, "Ohorn" }, /* LATIN CAPITAL LETTER O WITH HORN */
02082     { 0x01A1, "ohorn" }, /* LATIN SMALL LETTER O WITH HORN */
02083     { 0x01AF, "Uhorn" }, /* LATIN CAPITAL LETTER U WITH HORN */
02084     { 0x01B0, "uhorn" }, /* LATIN SMALL LETTER U WITH HORN */
02085     { 0x01E6, "Gcaron" }, /* LATIN CAPITAL LETTER G WITH CARON */
02086     { 0x01E7, "gcaron" }, /* LATIN SMALL LETTER G WITH CARON */
02087     { 0x01FA, "Aringacute" }, /* LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE */
02088     { 0x01FB, "aringacute" }, /* LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE */
02089     { 0x01FC, "AEacute" }, /* LATIN CAPITAL LETTER AE WITH ACUTE */
02090     { 0x01FD, "aeacute" }, /* LATIN SMALL LETTER AE WITH ACUTE */
02091     { 0x01FE, "Oslashacute" }, /* LATIN CAPITAL LETTER O WITH STROKE AND ACUTE */
02092     { 0x01FF, "oslashacute" }, /* LATIN SMALL LETTER O WITH STROKE AND ACUTE */
02093     { 0x0218, "Scommaaccent" }, /* LATIN CAPITAL LETTER S WITH COMMA BELOW */
02094     { 0x0219, "scommaaccent" }, /* LATIN SMALL LETTER S WITH COMMA BELOW */
02095     { 0x021A, "$Tcommaaccent" }, /* LATIN CAPITAL LETTER T WITH COMMA BELOW; distinguish Adobe duplicates */
02096     { 0x021B, "$tcommaaccent" }, /* LATIN SMALL LETTER T WITH COMMA BELOW; distinguish Adobe duplicates */
02097     { 0x02BC, "afii57929" }, /* MODIFIER LETTER APOSTROPHE */
02098     { 0x02BD, "afii64937" }, /* MODIFIER LETTER REVERSED COMMA */
02099     { 0x02C6, "circumflex" }, /* MODIFIER LETTER CIRCUMFLEX ACCENT */
02100     { 0x02C7, "caron" }, /* CARON */
02101     { 0x02C9, "$macronmodifier" }, /* MODIFIER LETTER MACRON */
02102     { 0x02CA, "$acutemodifier" }, /* MODIFIER LETTER ACUTE ACCENT */
02103     { 0x02CB, "$gravemodifier" }, /* MODIFIER LETTER GRAVE ACCENT */
02104     { 0x02D8, "breve" }, /* BREVE */
02105     { 0x02D9, "dotaccent" }, /* DOT ABOVE */
02106     { 0x02DA, "ring" }, /* RING ABOVE */
02107     { 0x02DB, "ogonek" }, /* OGONEK */
02108     { 0x02DC, "tilde" }, /* SMALL TILDE */
02109     { 0x02DD, "hungarumlaut" }, /* DOUBLE ACUTE ACCENT */
02110     { 0x0300, "gravecomb" }, /* COMBINING GRAVE ACCENT */
02111     { 0x0301, "acutecomb" }, /* COMBINING ACUTE ACCENT */
02112     { 0x0302, "$circumflexcomb" }, /* COMBINING CIRCUMFLEX ACCENT */
02113     { 0x0303, "tildecomb" }, /* COMBINING TILDE */
02114     { 0x0304, "$macroncomb" }, /* COMBINING MACRON */
02115     { 0x0305, "$overlinecomb" }, /* COMBINING OVERLINE */
02116     { 0x0306, "$brevecomb" }, /* COMBINING BREVE */
02117     { 0x0307, "$dotaccentcomb" }, /* COMBINING DOT ABOVE */
02118     { 0x0308, "$dieresiscomb" }, /* COMBINING DIAERESIS */
02119     { 0x0309, "hookabovecomb" }, /* COMBINING HOOK ABOVE */
02120     { 0x030A, "$ringcomb" }, /* COMBINING RING ABOVE */
02121     { 0x030C, "$caroncomb" }, /* COMBINING CARON */
02122     { 0x0323, "dotbelowcomb" }, /* COMBINING DOT BELOW */
02123     { 0x0327, "$cedillacomb" }, /* COMBINING CEDILLA */
02124     { 0x0328, "$ogonekcomb" }, /* COMBINING OGONEK */
02125     { 0x0338, "$slashlongcomb" }, /* COMBINING LONG SOLIDUS OVERLAY */
02126     { 0x0384, "tonos" }, /* GREEK TONOS */
02127     { 0x0385, "dieresistonos" }, /* GREEK DIALYTIKA TONOS */
02128     { 0x0386, "Alphatonos" }, /* GREEK CAPITAL LETTER ALPHA WITH TONOS */
02129     { 0x0387, "anoteleia" }, /* GREEK ANO TELEIA */
02130     { 0x0388, "Epsilontonos" }, /* GREEK CAPITAL LETTER EPSILON WITH TONOS */
02131     { 0x0389, "Etatonos" }, /* GREEK CAPITAL LETTER ETA WITH TONOS */
02132     { 0x038A, "Iotatonos" }, /* GREEK CAPITAL LETTER IOTA WITH TONOS */
02133     { 0x038C, "Omicrontonos" }, /* GREEK CAPITAL LETTER OMICRON WITH TONOS */
02134     { 0x038E, "Upsilontonos" }, /* GREEK CAPITAL LETTER UPSILON WITH TONOS */
02135     { 0x038F, "Omegatonos" }, /* GREEK CAPITAL LETTER OMEGA WITH TONOS */
02136     { 0x0390, "iotadieresistonos" }, /* GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS */
02137     { 0x0391, "Alpha" }, /* GREEK CAPITAL LETTER ALPHA */
02138     { 0x0392, "Beta" }, /* GREEK CAPITAL LETTER BETA */
02139     { 0x0393, "Gamma" }, /* GREEK CAPITAL LETTER GAMMA */
02140     { 0x0394, "$Delta"  }, /* GREEK CAPITAL LETTER DELTA; distinguish Adobe duplicates */
02141     { 0x0395, "Epsilon" }, /* GREEK CAPITAL LETTER EPSILON */
02142     { 0x0396, "Zeta" }, /* GREEK CAPITAL LETTER ZETA */
02143     { 0x0397, "Eta" }, /* GREEK CAPITAL LETTER ETA */
02144     { 0x0398, "Theta" }, /* GREEK CAPITAL LETTER THETA */
02145     { 0x0399, "Iota" }, /* GREEK CAPITAL LETTER IOTA */
02146     { 0x039A, "Kappa" }, /* GREEK CAPITAL LETTER KAPPA */
02147     { 0x039B, "Lambda" }, /* GREEK CAPITAL LETTER LAMDA */
02148     { 0x039C, "Mu" }, /* GREEK CAPITAL LETTER MU */
02149     { 0x039D, "Nu" }, /* GREEK CAPITAL LETTER NU */
02150     { 0x039E, "Xi" }, /* GREEK CAPITAL LETTER XI */
02151     { 0x039F, "Omicron" }, /* GREEK CAPITAL LETTER OMICRON */
02152     { 0x03A0, "Pi" }, /* GREEK CAPITAL LETTER PI */
02153     { 0x03A1, "Rho" }, /* GREEK CAPITAL LETTER RHO */
02154     { 0x03A3, "Sigma" }, /* GREEK CAPITAL LETTER SIGMA */
02155     { 0x03A4, "Tau" }, /* GREEK CAPITAL LETTER TAU */
02156     { 0x03A5, "Upsilon" }, /* GREEK CAPITAL LETTER UPSILON */
02157     { 0x03A6, "Phi" }, /* GREEK CAPITAL LETTER PHI */
02158     { 0x03A7, "Chi" }, /* GREEK CAPITAL LETTER CHI */
02159     { 0x03A8, "Psi" }, /* GREEK CAPITAL LETTER PSI */
02160     { 0x03A9, "$Omega"  }, /* GREEK CAPITAL LETTER OMEGA; distinguish Adobe duplicates */
02161     { 0x03AA, "Iotadieresis" }, /* GREEK CAPITAL LETTER IOTA WITH DIALYTIKA */
02162     { 0x03AB, "Upsilondieresis" }, /* GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA */
02163     { 0x03AC, "alphatonos" }, /* GREEK SMALL LETTER ALPHA WITH TONOS */
02164     { 0x03AD, "epsilontonos" }, /* GREEK SMALL LETTER EPSILON WITH TONOS */
02165     { 0x03AE, "etatonos" }, /* GREEK SMALL LETTER ETA WITH TONOS */
02166     { 0x03AF, "iotatonos" }, /* GREEK SMALL LETTER IOTA WITH TONOS */
02167     { 0x03B0, "upsilondieresistonos" }, /* GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS */
02168     { 0x03B1, "alpha" }, /* GREEK SMALL LETTER ALPHA */
02169     { 0x03B2, "beta" }, /* GREEK SMALL LETTER BETA */
02170     { 0x03B3, "gamma" }, /* GREEK SMALL LETTER GAMMA */
02171     { 0x03B4, "delta" }, /* GREEK SMALL LETTER DELTA */
02172     { 0x03B5, "epsilon" }, /* GREEK SMALL LETTER EPSILON */
02173     { 0x03B6, "zeta" }, /* GREEK SMALL LETTER ZETA */
02174     { 0x03B7, "eta" }, /* GREEK SMALL LETTER ETA */
02175     { 0x03B8, "theta" }, /* GREEK SMALL LETTER THETA */
02176     { 0x03B9, "iota" }, /* GREEK SMALL LETTER IOTA */
02177     { 0x03BA, "kappa" }, /* GREEK SMALL LETTER KAPPA */
02178     { 0x03BB, "lambda" }, /* GREEK SMALL LETTER LAMDA */
02179     { 0x03BC, "$mu" }, /* GREEK SMALL LETTER MU; distinguish Adobe duplicates */
02180     { 0x03BD, "nu" }, /* GREEK SMALL LETTER NU */
02181     { 0x03BE, "xi" }, /* GREEK SMALL LETTER XI */
02182     { 0x03BF, "omicron" }, /* GREEK SMALL LETTER OMICRON */
02183     { 0x03C0, "pi" }, /* GREEK SMALL LETTER PI */
02184     { 0x03C1, "rho" }, /* GREEK SMALL LETTER RHO */
02185     { 0x03C2, "sigma1" }, /* GREEK SMALL LETTER FINAL SIGMA */
02186     { 0x03C3, "sigma" }, /* GREEK SMALL LETTER SIGMA */
02187     { 0x03C4, "tau" }, /* GREEK SMALL LETTER TAU */
02188     { 0x03C5, "upsilon" }, /* GREEK SMALL LETTER UPSILON */
02189     { 0x03C6, "phi" }, /* GREEK SMALL LETTER PHI */
02190     { 0x03C7, "chi" }, /* GREEK SMALL LETTER CHI */
02191     { 0x03C8, "psi" }, /* GREEK SMALL LETTER PSI */
02192     { 0x03C9, "omega" }, /* GREEK SMALL LETTER OMEGA */
02193     { 0x03CA, "iotadieresis" }, /* GREEK SMALL LETTER IOTA WITH DIALYTIKA */
02194     { 0x03CB, "upsilondieresis" }, /* GREEK SMALL LETTER UPSILON WITH DIALYTIKA */
02195     { 0x03CC, "omicrontonos" }, /* GREEK SMALL LETTER OMICRON WITH TONOS */
02196     { 0x03CD, "upsilontonos" }, /* GREEK SMALL LETTER UPSILON WITH TONOS */
02197     { 0x03CE, "omegatonos" }, /* GREEK SMALL LETTER OMEGA WITH TONOS */
02198     { 0x03D1, "theta1" }, /* GREEK THETA SYMBOL */
02199     { 0x03D2, "Upsilon1" }, /* GREEK UPSILON WITH HOOK SYMBOL */
02200     { 0x03D5, "phi1" }, /* GREEK PHI SYMBOL */
02201     { 0x03D6, "omega1" }, /* GREEK PI SYMBOL */
02202     { 0x03D6, "$pi1" }, /* GREEK PI SYMBOL; Adobe has this as "omega1" which is too confusing */
02203     { 0x03F1, "$rho1" }, /* GREEK RHO SYMBOL */
02204     { 0x03F5, "$epsilon1" }, /* GREEK LUNATE EPSILON SYMBOL */
02205     { 0x0401, "afii10023" }, /* CYRILLIC CAPITAL LETTER IO */
02206     { 0x0402, "afii10051" }, /* CYRILLIC CAPITAL LETTER DJE */
02207     { 0x0403, "afii10052" }, /* CYRILLIC CAPITAL LETTER GJE */
02208     { 0x0404, "afii10053" }, /* CYRILLIC CAPITAL LETTER UKRAINIAN IE */
02209     { 0x0405, "afii10054" }, /* CYRILLIC CAPITAL LETTER DZE */
02210     { 0x0406, "afii10055" }, /* CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I */
02211     { 0x0407, "afii10056" }, /* CYRILLIC CAPITAL LETTER YI */
02212     { 0x0408, "afii10057" }, /* CYRILLIC CAPITAL LETTER JE */
02213     { 0x0409, "afii10058" }, /* CYRILLIC CAPITAL LETTER LJE */
02214     { 0x040A, "afii10059" }, /* CYRILLIC CAPITAL LETTER NJE */
02215     { 0x040B, "afii10060" }, /* CYRILLIC CAPITAL LETTER TSHE */
02216     { 0x040C, "afii10061" }, /* CYRILLIC CAPITAL LETTER KJE */
02217     { 0x040E, "afii10062" }, /* CYRILLIC CAPITAL LETTER SHORT U */
02218     { 0x040F, "afii10145" }, /* CYRILLIC CAPITAL LETTER DZHE */
02219     { 0x0410, "afii10017" }, /* CYRILLIC CAPITAL LETTER A */
02220     { 0x0411, "afii10018" }, /* CYRILLIC CAPITAL LETTER BE */
02221     { 0x0412, "afii10019" }, /* CYRILLIC CAPITAL LETTER VE */
02222     { 0x0413, "afii10020" }, /* CYRILLIC CAPITAL LETTER GHE */
02223     { 0x0414, "afii10021" }, /* CYRILLIC CAPITAL LETTER DE */
02224     { 0x0415, "afii10022" }, /* CYRILLIC CAPITAL LETTER IE */
02225     { 0x0416, "afii10024" }, /* CYRILLIC CAPITAL LETTER ZHE */
02226     { 0x0417, "afii10025" }, /* CYRILLIC CAPITAL LETTER ZE */
02227     { 0x0418, "afii10026" }, /* CYRILLIC CAPITAL LETTER I */
02228     { 0x0419, "afii10027" }, /* CYRILLIC CAPITAL LETTER SHORT I */
02229     { 0x041A, "afii10028" }, /* CYRILLIC CAPITAL LETTER KA */
02230     { 0x041B, "afii10029" }, /* CYRILLIC CAPITAL LETTER EL */
02231     { 0x041C, "afii10030" }, /* CYRILLIC CAPITAL LETTER EM */
02232     { 0x041D, "afii10031" }, /* CYRILLIC CAPITAL LETTER EN */
02233     { 0x041E, "afii10032" }, /* CYRILLIC CAPITAL LETTER O */
02234     { 0x041F, "afii10033" }, /* CYRILLIC CAPITAL LETTER PE */
02235     { 0x0420, "afii10034" }, /* CYRILLIC CAPITAL LETTER ER */
02236     { 0x0421, "afii10035" }, /* CYRILLIC CAPITAL LETTER ES */
02237     { 0x0422, "afii10036" }, /* CYRILLIC CAPITAL LETTER TE */
02238     { 0x0423, "afii10037" }, /* CYRILLIC CAPITAL LETTER U */
02239     { 0x0424, "afii10038" }, /* CYRILLIC CAPITAL LETTER EF */
02240     { 0x0425, "afii10039" }, /* CYRILLIC CAPITAL LETTER HA */
02241     { 0x0426, "afii10040" }, /* CYRILLIC CAPITAL LETTER TSE */
02242     { 0x0427, "afii10041" }, /* CYRILLIC CAPITAL LETTER CHE */
02243     { 0x0428, "afii10042" }, /* CYRILLIC CAPITAL LETTER SHA */
02244     { 0x0429, "afii10043" }, /* CYRILLIC CAPITAL LETTER SHCHA */
02245     { 0x042A, "afii10044" }, /* CYRILLIC CAPITAL LETTER HARD SIGN */
02246     { 0x042B, "afii10045" }, /* CYRILLIC CAPITAL LETTER YERU */
02247     { 0x042C, "afii10046" }, /* CYRILLIC CAPITAL LETTER SOFT SIGN */
02248     { 0x042D, "afii10047" }, /* CYRILLIC CAPITAL LETTER E */
02249     { 0x042E, "afii10048" }, /* CYRILLIC CAPITAL LETTER YU */
02250     { 0x042F, "afii10049" }, /* CYRILLIC CAPITAL LETTER YA */
02251     { 0x0430, "afii10065" }, /* CYRILLIC SMALL LETTER A */
02252     { 0x0431, "afii10066" }, /* CYRILLIC SMALL LETTER BE */
02253     { 0x0432, "afii10067" }, /* CYRILLIC SMALL LETTER VE */
02254     { 0x0433, "afii10068" }, /* CYRILLIC SMALL LETTER GHE */
02255     { 0x0434, "afii10069" }, /* CYRILLIC SMALL LETTER DE */
02256     { 0x0435, "afii10070" }, /* CYRILLIC SMALL LETTER IE */
02257     { 0x0436, "afii10072" }, /* CYRILLIC SMALL LETTER ZHE */
02258     { 0x0437, "afii10073" }, /* CYRILLIC SMALL LETTER ZE */
02259     { 0x0438, "afii10074" }, /* CYRILLIC SMALL LETTER I */
02260     { 0x0439, "afii10075" }, /* CYRILLIC SMALL LETTER SHORT I */
02261     { 0x043A, "afii10076" }, /* CYRILLIC SMALL LETTER KA */
02262     { 0x043B, "afii10077" }, /* CYRILLIC SMALL LETTER EL */
02263     { 0x043C, "afii10078" }, /* CYRILLIC SMALL LETTER EM */
02264     { 0x043D, "afii10079" }, /* CYRILLIC SMALL LETTER EN */
02265     { 0x043E, "afii10080" }, /* CYRILLIC SMALL LETTER O */
02266     { 0x043F, "afii10081" }, /* CYRILLIC SMALL LETTER PE */
02267     { 0x0440, "afii10082" }, /* CYRILLIC SMALL LETTER ER */
02268     { 0x0441, "afii10083" }, /* CYRILLIC SMALL LETTER ES */
02269     { 0x0442, "afii10084" }, /* CYRILLIC SMALL LETTER TE */
02270     { 0x0443, "afii10085" }, /* CYRILLIC SMALL LETTER U */
02271     { 0x0444, "afii10086" }, /* CYRILLIC SMALL LETTER EF */
02272     { 0x0445, "afii10087" }, /* CYRILLIC SMALL LETTER HA */
02273     { 0x0446, "afii10088" }, /* CYRILLIC SMALL LETTER TSE */
02274     { 0x0447, "afii10089" }, /* CYRILLIC SMALL LETTER CHE */
02275     { 0x0448, "afii10090" }, /* CYRILLIC SMALL LETTER SHA */
02276     { 0x0449, "afii10091" }, /* CYRILLIC SMALL LETTER SHCHA */
02277     { 0x044A, "afii10092" }, /* CYRILLIC SMALL LETTER HARD SIGN */
02278     { 0x044B, "afii10093" }, /* CYRILLIC SMALL LETTER YERU */
02279     { 0x044C, "afii10094" }, /* CYRILLIC SMALL LETTER SOFT SIGN */
02280     { 0x044D, "afii10095" }, /* CYRILLIC SMALL LETTER E */
02281     { 0x044E, "afii10096" }, /* CYRILLIC SMALL LETTER YU */
02282     { 0x044F, "afii10097" }, /* CYRILLIC SMALL LETTER YA */
02283     { 0x0451, "afii10071" }, /* CYRILLIC SMALL LETTER IO */
02284     { 0x0452, "afii10099" }, /* CYRILLIC SMALL LETTER DJE */
02285     { 0x0453, "afii10100" }, /* CYRILLIC SMALL LETTER GJE */
02286     { 0x0454, "afii10101" }, /* CYRILLIC SMALL LETTER UKRAINIAN IE */
02287     { 0x0455, "afii10102" }, /* CYRILLIC SMALL LETTER DZE */
02288     { 0x0456, "afii10103" }, /* CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I */
02289     { 0x0457, "afii10104" }, /* CYRILLIC SMALL LETTER YI */
02290     { 0x0458, "afii10105" }, /* CYRILLIC SMALL LETTER JE */
02291     { 0x0459, "afii10106" }, /* CYRILLIC SMALL LETTER LJE */
02292     { 0x045A, "afii10107" }, /* CYRILLIC SMALL LETTER NJE */
02293     { 0x045B, "afii10108" }, /* CYRILLIC SMALL LETTER TSHE */
02294     { 0x045C, "afii10109" }, /* CYRILLIC SMALL LETTER KJE */
02295     { 0x045E, "afii10110" }, /* CYRILLIC SMALL LETTER SHORT U */
02296     { 0x045F, "afii10193" }, /* CYRILLIC SMALL LETTER DZHE */
02297     { 0x0462, "afii10146" }, /* CYRILLIC CAPITAL LETTER YAT */
02298     { 0x0463, "afii10194" }, /* CYRILLIC SMALL LETTER YAT */
02299     { 0x0472, "afii10147" }, /* CYRILLIC CAPITAL LETTER FITA */
02300     { 0x0473, "afii10195" }, /* CYRILLIC SMALL LETTER FITA */
02301     { 0x0474, "afii10148" }, /* CYRILLIC CAPITAL LETTER IZHITSA */
02302     { 0x0475, "afii10196" }, /* CYRILLIC SMALL LETTER IZHITSA */
02303     { 0x0490, "afii10050" }, /* CYRILLIC CAPITAL LETTER GHE WITH UPTURN */
02304     { 0x0491, "afii10098" }, /* CYRILLIC SMALL LETTER GHE WITH UPTURN */
02305     { 0x04D9, "afii10846" }, /* CYRILLIC SMALL LETTER SCHWA */
02306     { 0x05B0, "afii57799" }, /* HEBREW POINT SHEVA */
02307     { 0x05B1, "afii57801" }, /* HEBREW POINT HATAF SEGOL */
02308     { 0x05B2, "afii57800" }, /* HEBREW POINT HATAF PATAH */
02309     { 0x05B3, "afii57802" }, /* HEBREW POINT HATAF QAMATS */
02310     { 0x05B4, "afii57793" }, /* HEBREW POINT HIRIQ */
02311     { 0x05B5, "afii57794" }, /* HEBREW POINT TSERE */
02312     { 0x05B6, "afii57795" }, /* HEBREW POINT SEGOL */
02313     { 0x05B7, "afii57798" }, /* HEBREW POINT PATAH */
02314     { 0x05B8, "afii57797" }, /* HEBREW POINT QAMATS */
02315     { 0x05B9, "afii57806" }, /* HEBREW POINT HOLAM */
02316     { 0x05BB, "afii57796" }, /* HEBREW POINT QUBUTS */
02317     { 0x05BC, "afii57807" }, /* HEBREW POINT DAGESH OR MAPIQ */
02318     { 0x05BD, "afii57839" }, /* HEBREW POINT METEG */
02319     { 0x05BE, "afii57645" }, /* HEBREW PUNCTUATION MAQAF */
02320     { 0x05BF, "afii57841" }, /* HEBREW POINT RAFE */
02321     { 0x05C0, "afii57842" }, /* HEBREW PUNCTUATION PASEQ */
02322     { 0x05C1, "afii57804" }, /* HEBREW POINT SHIN DOT */
02323     { 0x05C2, "afii57803" }, /* HEBREW POINT SIN DOT */
02324     { 0x05C3, "afii57658" }, /* HEBREW PUNCTUATION SOF PASUQ */
02325     { 0x05D0, "afii57664" }, /* HEBREW LETTER ALEF */
02326     { 0x05D1, "afii57665" }, /* HEBREW LETTER BET */
02327     { 0x05D2, "afii57666" }, /* HEBREW LETTER GIMEL */
02328     { 0x05D3, "afii57667" }, /* HEBREW LETTER DALET */
02329     { 0x05D4, "afii57668" }, /* HEBREW LETTER HE */
02330     { 0x05D5, "afii57669" }, /* HEBREW LETTER VAV */
02331     { 0x05D6, "afii57670" }, /* HEBREW LETTER ZAYIN */
02332     { 0x05D7, "afii57671" }, /* HEBREW LETTER HET */
02333     { 0x05D8, "afii57672" }, /* HEBREW LETTER TET */
02334     { 0x05D9, "afii57673" }, /* HEBREW LETTER YOD */
02335     { 0x05DA, "afii57674" }, /* HEBREW LETTER FINAL KAF */
02336     { 0x05DB, "afii57675" }, /* HEBREW LETTER KAF */
02337     { 0x05DC, "afii57676" }, /* HEBREW LETTER LAMED */
02338     { 0x05DD, "afii57677" }, /* HEBREW LETTER FINAL MEM */
02339     { 0x05DE, "afii57678" }, /* HEBREW LETTER MEM */
02340     { 0x05DF, "afii57679" }, /* HEBREW LETTER FINAL NUN */
02341     { 0x05E0, "afii57680" }, /* HEBREW LETTER NUN */
02342     { 0x05E1, "afii57681" }, /* HEBREW LETTER SAMEKH */
02343     { 0x05E2, "afii57682" }, /* HEBREW LETTER AYIN */
02344     { 0x05E3, "afii57683" }, /* HEBREW LETTER FINAL PE */
02345     { 0x05E4, "afii57684" }, /* HEBREW LETTER PE */
02346     { 0x05E5, "afii57685" }, /* HEBREW LETTER FINAL TSADI */
02347     { 0x05E6, "afii57686" }, /* HEBREW LETTER TSADI */
02348     { 0x05E7, "afii57687" }, /* HEBREW LETTER QOF */
02349     { 0x05E8, "afii57688" }, /* HEBREW LETTER RESH */
02350     { 0x05E9, "afii57689" }, /* HEBREW LETTER SHIN */
02351     { 0x05EA, "afii57690" }, /* HEBREW LETTER TAV */
02352     { 0x05F0, "afii57716" }, /* HEBREW LIGATURE YIDDISH DOUBLE VAV */
02353     { 0x05F1, "afii57717" }, /* HEBREW LIGATURE YIDDISH VAV YOD */
02354     { 0x05F2, "afii57718" }, /* HEBREW LIGATURE YIDDISH DOUBLE YOD */
02355     { 0x060C, "afii57388" }, /* ARABIC COMMA */
02356     { 0x061B, "afii57403" }, /* ARABIC SEMICOLON */
02357     { 0x061F, "afii57407" }, /* ARABIC QUESTION MARK */
02358     { 0x0621, "afii57409" }, /* ARABIC LETTER HAMZA */
02359     { 0x0622, "afii57410" }, /* ARABIC LETTER ALEF WITH MADDA ABOVE */
02360     { 0x0623, "afii57411" }, /* ARABIC LETTER ALEF WITH HAMZA ABOVE */
02361     { 0x0624, "afii57412" }, /* ARABIC LETTER WAW WITH HAMZA ABOVE */
02362     { 0x0625, "afii57413" }, /* ARABIC LETTER ALEF WITH HAMZA BELOW */
02363     { 0x0626, "afii57414" }, /* ARABIC LETTER YEH WITH HAMZA ABOVE */
02364     { 0x0627, "afii57415" }, /* ARABIC LETTER ALEF */
02365     { 0x0628, "afii57416" }, /* ARABIC LETTER BEH */
02366     { 0x0629, "afii57417" }, /* ARABIC LETTER TEH MARBUTA */
02367     { 0x062A, "afii57418" }, /* ARABIC LETTER TEH */
02368     { 0x062B, "afii57419" }, /* ARABIC LETTER THEH */
02369     { 0x062C, "afii57420" }, /* ARABIC LETTER JEEM */
02370     { 0x062D, "afii57421" }, /* ARABIC LETTER HAH */
02371     { 0x062E, "afii57422" }, /* ARABIC LETTER KHAH */
02372     { 0x062F, "afii57423" }, /* ARABIC LETTER DAL */
02373     { 0x0630, "afii57424" }, /* ARABIC LETTER THAL */
02374     { 0x0631, "afii57425" }, /* ARABIC LETTER REH */
02375     { 0x0632, "afii57426" }, /* ARABIC LETTER ZAIN */
02376     { 0x0633, "afii57427" }, /* ARABIC LETTER SEEN */
02377     { 0x0634, "afii57428" }, /* ARABIC LETTER SHEEN */
02378     { 0x0635, "afii57429" }, /* ARABIC LETTER SAD */
02379     { 0x0636, "afii57430" }, /* ARABIC LETTER DAD */
02380     { 0x0637, "afii57431" }, /* ARABIC LETTER TAH */
02381     { 0x0638, "afii57432" }, /* ARABIC LETTER ZAH */
02382     { 0x0639, "afii57433" }, /* ARABIC LETTER AIN */
02383     { 0x063A, "afii57434" }, /* ARABIC LETTER GHAIN */
02384     { 0x0640, "afii57440" }, /* ARABIC TATWEEL */
02385     { 0x0641, "afii57441" }, /* ARABIC LETTER FEH */
02386     { 0x0642, "afii57442" }, /* ARABIC LETTER QAF */
02387     { 0x0643, "afii57443" }, /* ARABIC LETTER KAF */
02388     { 0x0644, "afii57444" }, /* ARABIC LETTER LAM */
02389     { 0x0645, "afii57445" }, /* ARABIC LETTER MEEM */
02390     { 0x0646, "afii57446" }, /* ARABIC LETTER NOON */
02391     { 0x0647, "afii57470" }, /* ARABIC LETTER HEH */
02392     { 0x0648, "afii57448" }, /* ARABIC LETTER WAW */
02393     { 0x0649, "afii57449" }, /* ARABIC LETTER ALEF MAKSURA */
02394     { 0x064A, "afii57450" }, /* ARABIC LETTER YEH */
02395     { 0x064B, "afii57451" }, /* ARABIC FATHATAN */
02396     { 0x064C, "afii57452" }, /* ARABIC DAMMATAN */
02397     { 0x064D, "afii57453" }, /* ARABIC KASRATAN */
02398     { 0x064E, "afii57454" }, /* ARABIC FATHA */
02399     { 0x064F, "afii57455" }, /* ARABIC DAMMA */
02400     { 0x0650, "afii57456" }, /* ARABIC KASRA */
02401     { 0x0651, "afii57457" }, /* ARABIC SHADDA */
02402     { 0x0652, "afii57458" }, /* ARABIC SUKUN */
02403     { 0x0660, "afii57392" }, /* ARABIC-INDIC DIGIT ZERO */
02404     { 0x0661, "afii57393" }, /* ARABIC-INDIC DIGIT ONE */
02405     { 0x0662, "afii57394" }, /* ARABIC-INDIC DIGIT TWO */
02406     { 0x0663, "afii57395" }, /* ARABIC-INDIC DIGIT THREE */
02407     { 0x0664, "afii57396" }, /* ARABIC-INDIC DIGIT FOUR */
02408     { 0x0665, "afii57397" }, /* ARABIC-INDIC DIGIT FIVE */
02409     { 0x0666, "afii57398" }, /* ARABIC-INDIC DIGIT SIX */
02410     { 0x0667, "afii57399" }, /* ARABIC-INDIC DIGIT SEVEN */
02411     { 0x0668, "afii57400" }, /* ARABIC-INDIC DIGIT EIGHT */
02412     { 0x0669, "afii57401" }, /* ARABIC-INDIC DIGIT NINE */
02413     { 0x066A, "afii57381" }, /* ARABIC PERCENT SIGN */
02414     { 0x066D, "afii63167" }, /* ARABIC FIVE POINTED STAR */
02415     { 0x0679, "afii57511" }, /* ARABIC LETTER TTEH */
02416     { 0x067E, "afii57506" }, /* ARABIC LETTER PEH */
02417     { 0x0686, "afii57507" }, /* ARABIC LETTER TCHEH */
02418     { 0x0688, "afii57512" }, /* ARABIC LETTER DDAL */
02419     { 0x0691, "afii57513" }, /* ARABIC LETTER RREH */
02420     { 0x0698, "afii57508" }, /* ARABIC LETTER JEH */
02421     { 0x06A4, "afii57505" }, /* ARABIC LETTER VEH */
02422     { 0x06AF, "afii57509" }, /* ARABIC LETTER GAF */
02423     { 0x06BA, "afii57514" }, /* ARABIC LETTER NOON GHUNNA */
02424     { 0x06D2, "afii57519" }, /* ARABIC LETTER YEH BARREE */
02425     { 0x06D5, "afii57534" }, /* ARABIC LETTER AE */
02426     { 0x1E80, "Wgrave" }, /* LATIN CAPITAL LETTER W WITH GRAVE */
02427     { 0x1E81, "wgrave" }, /* LATIN SMALL LETTER W WITH GRAVE */
02428     { 0x1E82, "Wacute" }, /* LATIN CAPITAL LETTER W WITH ACUTE */
02429     { 0x1E83, "wacute" }, /* LATIN SMALL LETTER W WITH ACUTE */
02430     { 0x1E84, "Wdieresis" }, /* LATIN CAPITAL LETTER W WITH DIAERESIS */
02431     { 0x1E85, "wdieresis" }, /* LATIN SMALL LETTER W WITH DIAERESIS */
02432     { 0x1EF2, "Ygrave" }, /* LATIN CAPITAL LETTER Y WITH GRAVE */
02433     { 0x1EF3, "ygrave" }, /* LATIN SMALL LETTER Y WITH GRAVE */
02434     { 0x200C, "afii61664" }, /* ZERO WIDTH NON-JOINER */
02435     { 0x200D, "afii301" }, /* ZERO WIDTH JOINER */
02436     { 0x200E, "afii299" }, /* LEFT-TO-RIGHT MARK */
02437     { 0x200F, "afii300" }, /* RIGHT-TO-LEFT MARK */
02438     { 0x2012, "figuredash" }, /* FIGURE DASH */
02439     { 0x2013, "endash" }, /* EN DASH */
02440     { 0x2014, "emdash" }, /* EM DASH */
02441     { 0x2015, "afii00208" }, /* HORIZONTAL BAR */
02442     { 0x2017, "underscoredbl" }, /* DOUBLE LOW LINE */
02443     { 0x2018, "quoteleft" }, /* LEFT SINGLE QUOTATION MARK */
02444     { 0x2019, "quoteright" }, /* RIGHT SINGLE QUOTATION MARK */
02445     { 0x201A, "quotesinglbase" }, /* SINGLE LOW-9 QUOTATION MARK */
02446     { 0x201B, "quotereversed" }, /* SINGLE HIGH-REVERSED-9 QUOTATION MARK */
02447     { 0x201C, "quotedblleft" }, /* LEFT DOUBLE QUOTATION MARK */
02448     { 0x201D, "quotedblright" }, /* RIGHT DOUBLE QUOTATION MARK */
02449     { 0x201E, "quotedblbase" }, /* DOUBLE LOW-9 QUOTATION MARK */
02450     { 0x201F, "$quotedblreversed" }, /* DOUBLE HIGH-REVERSED-9 QUOTATION MARK */
02451     { 0x2020, "dagger" }, /* DAGGER */
02452     { 0x2021, "daggerdbl" }, /* DOUBLE DAGGER */
02453     { 0x2022, "bullet" }, /* BULLET */
02454     { 0x2024, "onedotenleader" }, /* ONE DOT LEADER */
02455     { 0x2025, "twodotenleader" }, /* TWO DOT LEADER */
02456     { 0x2026, "ellipsis" }, /* HORIZONTAL ELLIPSIS */
02457     { 0x202C, "afii61573" }, /* POP DIRECTIONAL FORMATTING */
02458     { 0x202D, "afii61574" }, /* LEFT-TO-RIGHT OVERRIDE */
02459     { 0x202E, "afii61575" }, /* RIGHT-TO-LEFT OVERRIDE */
02460     { 0x2030, "perthousand" }, /* PER MILLE SIGN */
02461     { 0x2032, "minute" }, /* PRIME */
02462     { 0x2033, "second" }, /* DOUBLE PRIME */
02463     { 0x2039, "guilsinglleft" }, /* SINGLE LEFT-POINTING ANGLE QUOTATION MARK */
02464     { 0x203A, "guilsinglright" }, /* SINGLE RIGHT-POINTING ANGLE QUOTATION MARK */
02465     { 0x203C, "exclamdbl" }, /* DOUBLE EXCLAMATION MARK */
02466     { 0x2040, "$tie" }, /* CHARACTER TIE */
02467     { 0x2044, "fraction" }, /* FRACTION SLASH */
02468     { 0x2044, "$fractionslash" }, /* FRACTION SLASH; distinguish Adobe duplicates */
02469     { 0x2070, "zerosuperior" }, /* SUPERSCRIPT ZERO */
02470     { 0x2074, "foursuperior" }, /* SUPERSCRIPT FOUR */
02471     { 0x2075, "fivesuperior" }, /* SUPERSCRIPT FIVE */
02472     { 0x2076, "sixsuperior" }, /* SUPERSCRIPT SIX */
02473     { 0x2077, "sevensuperior" }, /* SUPERSCRIPT SEVEN */
02474     { 0x2078, "eightsuperior" }, /* SUPERSCRIPT EIGHT */
02475     { 0x2079, "ninesuperior" }, /* SUPERSCRIPT NINE */
02476     { 0x207D, "parenleftsuperior" }, /* SUPERSCRIPT LEFT PARENTHESIS */
02477     { 0x207E, "parenrightsuperior" }, /* SUPERSCRIPT RIGHT PARENTHESIS */
02478     { 0x207F, "nsuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER N */
02479     { 0x2080, "zeroinferior" }, /* SUBSCRIPT ZERO */
02480     { 0x2081, "oneinferior" }, /* SUBSCRIPT ONE */
02481     { 0x2082, "twoinferior" }, /* SUBSCRIPT TWO */
02482     { 0x2083, "threeinferior" }, /* SUBSCRIPT THREE */
02483     { 0x2084, "fourinferior" }, /* SUBSCRIPT FOUR */
02484     { 0x2085, "fiveinferior" }, /* SUBSCRIPT FIVE */
02485     { 0x2086, "sixinferior" }, /* SUBSCRIPT SIX */
02486     { 0x2087, "seveninferior" }, /* SUBSCRIPT SEVEN */
02487     { 0x2088, "eightinferior" }, /* SUBSCRIPT EIGHT */
02488     { 0x2089, "nineinferior" }, /* SUBSCRIPT NINE */
02489     { 0x208D, "parenleftinferior" }, /* SUBSCRIPT LEFT PARENTHESIS */
02490     { 0x208E, "parenrightinferior" }, /* SUBSCRIPT RIGHT PARENTHESIS */
02491     { 0x20A1, "colonmonetary" }, /* COLON SIGN */
02492     { 0x20A3, "franc" }, /* FRENCH FRANC SIGN */
02493     { 0x20A4, "lira" }, /* LIRA SIGN */
02494     { 0x20A7, "peseta" }, /* PESETA SIGN */
02495     { 0x20AA, "afii57636" }, /* NEW SHEQEL SIGN */
02496     { 0x20AB, "dong" }, /* DONG SIGN */
02497     { 0x20AC, "Euro" }, /* EURO SIGN */
02498     { 0x20D7, "$vectorcomb" }, /* COMBINING RIGHT ARROW ABOVE */
02499     { 0x20DD, "$circlecomb" }, /* COMBINING ENCLOSING CIRCLE */
02500     { 0x2105, "afii61248" }, /* CARE OF */
02501     { 0x2111, "Ifraktur" }, /* BLACK-LETTER CAPITAL I */
02502     { 0x2113, "afii61289" }, /* SCRIPT SMALL L */
02503     { 0x2113, "$lscript" }, /* SCRIPT SMALL L; Adobe has this as "afii61289" */
02504     { 0x2116, "afii61352" }, /* NUMERO SIGN */
02505     { 0x2118, "weierstrass" }, /* SCRIPT CAPITAL P */
02506     { 0x211C, "Rfraktur" }, /* BLACK-LETTER CAPITAL R */
02507     { 0x211E, "prescription" }, /* PRESCRIPTION TAKE */
02508     { 0x2122, "trademark" }, /* TRADE MARK SIGN */
02509     { 0x2126, "$Ohm"  }, /* OHM SIGN; distinguish Adobe duplicates */
02510     { 0x2126, "Omega" }, /* OHM SIGN */
02511     { 0x212E, "estimated" }, /* ESTIMATED SYMBOL */
02512     { 0x2135, "aleph" }, /* ALEF SYMBOL */
02513     { 0x2153, "onethird" }, /* VULGAR FRACTION ONE THIRD */
02514     { 0x2154, "twothirds" }, /* VULGAR FRACTION TWO THIRDS */
02515     { 0x215B, "oneeighth" }, /* VULGAR FRACTION ONE EIGHTH */
02516     { 0x215C, "threeeighths" }, /* VULGAR FRACTION THREE EIGHTHS */
02517     { 0x215D, "fiveeighths" }, /* VULGAR FRACTION FIVE EIGHTHS */
02518     { 0x215E, "seveneighths" }, /* VULGAR FRACTION SEVEN EIGHTHS */
02519     { 0x2190, "arrowleft" }, /* LEFTWARDS ARROW */
02520     { 0x2191, "arrowup" }, /* UPWARDS ARROW */
02521     { 0x2192, "arrowright" }, /* RIGHTWARDS ARROW */
02522     { 0x2193, "arrowdown" }, /* DOWNWARDS ARROW */
02523     { 0x2194, "arrowboth" }, /* LEFT RIGHT ARROW */
02524     { 0x2195, "arrowupdn" }, /* UP DOWN ARROW */
02525     { 0x2196, "$arrownorthwest" }, /* NORTH WEST ARROW */
02526     { 0x2197, "$arrownortheast" }, /* NORTH EAST ARROW */
02527     { 0x2198, "$arrowsoutheast" }, /* SOUTH EAST ARROW */
02528     { 0x2199, "$arrowsouthwest" }, /* SOUTH WEST ARROW */
02529     { 0x21A8, "arrowupdnbse" }, /* UP DOWN ARROW WITH BASE */
02530     { 0x21B5, "carriagereturn" }, /* DOWNWARDS ARROW WITH CORNER LEFTWARDS */
02531     { 0x21BC, "$harpoonleftbarbup" }, /* LEFTWARDS HARPOON WITH BARB UPWARDS */
02532     { 0x21BD, "$harpoonleftbarbdown" }, /* LEFTWARDS HARPOON WITH BARB DOWNWARDS */
02533     { 0x21C0, "$harpoonrightbarbup" }, /* RIGHTWARDS HARPOON WITH BARB UPWARDS */
02534     { 0x21C1, "$harpoonrightbarbdown" }, /* RIGHTWARDS HARPOON WITH BARB DOWNWARDS */
02535     { 0x21D0, "arrowdblleft" }, /* LEFTWARDS DOUBLE ARROW */
02536     { 0x21D1, "arrowdblup" }, /* UPWARDS DOUBLE ARROW */
02537     { 0x21D2, "arrowdblright" }, /* RIGHTWARDS DOUBLE ARROW */
02538     { 0x21D3, "arrowdbldown" }, /* DOWNWARDS DOUBLE ARROW */
02539     { 0x21D4, "arrowdblboth" }, /* LEFT RIGHT DOUBLE ARROW */
02540     { 0x21D5, "$arrowdblupdn" }, /* UP DOWN DOUBLE ARROW */
02541     { 0x2200, "universal" }, /* FOR ALL */
02542     { 0x2202, "partialdiff" }, /* PARTIAL DIFFERENTIAL */
02543     { 0x2203, "existential" }, /* THERE EXISTS */
02544     { 0x2205, "emptyset" }, /* EMPTY SET */
02545     { 0x2206, "Delta" }, /* INCREMENT */
02546     { 0x2206, "$increment"  }, /* INCREMENT; distinguish Adobe duplicates */
02547     { 0x2207, "gradient" }, /* NABLA */
02548     { 0x2208, "element" }, /* ELEMENT OF */
02549     { 0x2209, "notelement" }, /* NOT AN ELEMENT OF */
02550     { 0x220B, "suchthat" }, /* CONTAINS AS MEMBER */
02551     { 0x220F, "product" }, /* N-ARY PRODUCT */
02552     { 0x2210, "$coproduct" }, /* N-ARY COPRODUCT */
02553     { 0x2211, "summation" }, /* N-ARY SUMMATION */
02554     { 0x2212, "minus" }, /* MINUS SIGN */
02555     { 0x2213, "$minusplus" }, /* MINUS-OR-PLUS SIGN */
02556     { 0x2215, "$divisionslash" }, /* DIVISION SLASH; distinguish Adobe duplicates */
02557     { 0x2217, "asteriskmath" }, /* ASTERISK OPERATOR */
02558     { 0x2219, "$bulletmath"  }, /* BULLET OPERATOR; distinguish Adobe duplicates */
02559     { 0x221A, "radical" }, /* SQUARE ROOT */
02560     { 0x221D, "proportional" }, /* PROPORTIONAL TO */
02561     { 0x221E, "infinity" }, /* INFINITY */
02562     { 0x221F, "orthogonal" }, /* RIGHT ANGLE */
02563     { 0x2220, "angle" }, /* ANGLE */
02564     { 0x2225, "$parallel" }, /* PARALLEL TO */
02565     { 0x2227, "logicaland" }, /* LOGICAL AND */
02566     { 0x2228, "logicalor" }, /* LOGICAL OR */
02567     { 0x2229, "intersection" }, /* INTERSECTION */
02568     { 0x222A, "union" }, /* UNION */
02569     { 0x222B, "integral" }, /* INTEGRAL */
02570     { 0x222E, "$contintegral" }, /* CONTOUR INTEGRAL */
02571     { 0x2234, "therefore" }, /* THEREFORE */
02572     { 0x223C, "similar" }, /* TILDE OPERATOR */
02573     { 0x2240, "$wreathproduct" }, /* WREATH PRODUCT */
02574     { 0x2243, "$similarequal" }, /* ASYMPTOTICALLY EQUAL TO */
02575     { 0x2245, "congruent" }, /* APPROXIMATELY EQUAL TO */
02576     { 0x2248, "approxequal" }, /* ALMOST EQUAL TO */
02577     { 0x224D, "$equivasymptotic" }, /* EQUIVALENT TO */
02578     { 0x2260, "notequal" }, /* NOT EQUAL TO */
02579     { 0x2261, "equivalence" }, /* IDENTICAL TO */
02580     { 0x2264, "lessequal" }, /* LESS-THAN OR EQUAL TO */
02581     { 0x2265, "greaterequal" }, /* GREATER-THAN OR EQUAL TO */
02582     { 0x226A, "$lessmuch" }, /* MUCH-LESS THAN */
02583     { 0x226B, "$greatermuch" }, /* MUCH GREATER-THAN */
02584     { 0x227A, "$precedes" }, /* PRECEDES */
02585     { 0x227B, "$follows" }, /* SUCCEEDS */
02586     { 0x227C, "$precedesequal" }, /* PRECEDES OR EQUAL TO */
02587     { 0x227D, "$followsequal" }, /* SUCCEEDS OR EQUAL TO */
02588     { 0x2282, "propersubset" }, /* SUBSET OF */
02589     { 0x2283, "propersuperset" }, /* SUPERSET OF */
02590     { 0x2284, "notsubset" }, /* NOT A SUBSET OF */
02591     { 0x2286, "reflexsubset" }, /* SUBSET OF OR EQUAL TO */
02592     { 0x2287, "reflexsuperset" }, /* SUPERSET OF OR EQUAL TO */
02593     { 0x228E, "$unionmulti" }, /* MULTISET UNION */
02594     { 0x2291, "$reflexsubsetsq" }, /* SQUARE IMAGE OF OR EQUAL TO */
02595     { 0x2292, "$reflexsupersetsq" }, /* SQUARE ORIGINAL OF OR EQUAL TO */
02596     { 0x2293, "$intersectionsq" }, /* SQUARE CAP */
02597     { 0x2294, "$unionsq" }, /* SQUARE CUP */
02598     { 0x2295, "circleplus" }, /* CIRCLED PLUS */
02599     { 0x2296, "$circleminus" }, /* CIRCLED MINUS */
02600     { 0x2297, "circlemultiply" }, /* CIRCLED TIMES */
02601     { 0x2298, "$circledivide" }, /* CIRCLED DIVISION SLASH */
02602     { 0x2299, "$circledot" }, /* CIRCLED DOT OPERATOR */
02603     { 0x22A2, "$turnstileleft" }, /* RIGHT TACK */
02604     { 0x22A3, "$turnstileright" }, /* LEFT TACK */
02605     { 0x22A4, "$latticetop" }, /* DOWN TACK */
02606     { 0x22A5, "perpendicular" }, /* UP TACK */
02607     { 0x22B2, "$normalin" }, /* NORMAL SUBGROUP OF */
02608     { 0x22B3, "$normalizes" }, /* CONTAINS AS NORMAL SUBGROUP */
02609     { 0x22B4, "$reflexnormalin" }, /* NORMAL SUBGROUP OF OR EQUAL TO */
02610     { 0x22B5, "$reflexnormalizes" }, /* CONTAINS AS NORMAL SUBGROUP OR EQUAL TO */
02611     { 0x22C4, "$diamondmath" }, /* DIAMOND OPERATOR */
02612     { 0x22C5, "dotmath" }, /* DOT OPERATOR */
02613     { 0x22C6, "$starmath" }, /* STAR OPERATOR */
02614     { 0x2302, "house" }, /* HOUSE */
02615     { 0x2308, "$ceilingleft" }, /* LEFT CEILING */
02616     { 0x2309, "$ceilingright" }, /* RIGHT CEILING */
02617     { 0x230A, "$floorleft" }, /* LEFT FLOOR */
02618     { 0x230B, "$floorright" }, /* RIGHT FLOOR */
02619     { 0x2310, "revlogicalnot" }, /* REVERSED NOT SIGN */
02620     { 0x2320, "integraltp" }, /* TOP HALF INTEGRAL */
02621     { 0x2321, "integralbt" }, /* BOTTOM HALF INTEGRAL */
02622     { 0x2322, "$frown" }, /* FROWN */
02623     { 0x2323, "$smile" }, /* SMILE */
02624     { 0x2329, "angleleft" }, /* LEFT-POINTING ANGLE BRACKET */
02625     { 0x232A, "angleright" }, /* RIGHT-POINTING ANGLE BRACKET */
02626     { 0x2420, "$spacesymbol" }, /* SYMBOL FOR SPACE */
02627     { 0x2500, "SF100000" }, /* BOX DRAWINGS LIGHT HORIZONTAL */
02628     { 0x2502, "SF110000" }, /* BOX DRAWINGS LIGHT VERTICAL */
02629     { 0x250C, "SF010000" }, /* BOX DRAWINGS LIGHT DOWN AND RIGHT */
02630     { 0x2510, "SF030000" }, /* BOX DRAWINGS LIGHT DOWN AND LEFT */
02631     { 0x2514, "SF020000" }, /* BOX DRAWINGS LIGHT UP AND RIGHT */
02632     { 0x2518, "SF040000" }, /* BOX DRAWINGS LIGHT UP AND LEFT */
02633     { 0x251C, "SF080000" }, /* BOX DRAWINGS LIGHT VERTICAL AND RIGHT */
02634     { 0x2524, "SF090000" }, /* BOX DRAWINGS LIGHT VERTICAL AND LEFT */
02635     { 0x252C, "SF060000" }, /* BOX DRAWINGS LIGHT DOWN AND HORIZONTAL */
02636     { 0x2534, "SF070000" }, /* BOX DRAWINGS LIGHT UP AND HORIZONTAL */
02637     { 0x253C, "SF050000" }, /* BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL */
02638     { 0x2550, "SF430000" }, /* BOX DRAWINGS DOUBLE HORIZONTAL */
02639     { 0x2551, "SF240000" }, /* BOX DRAWINGS DOUBLE VERTICAL */
02640     { 0x2552, "SF510000" }, /* BOX DRAWINGS DOWN SINGLE AND RIGHT DOUBLE */
02641     { 0x2553, "SF520000" }, /* BOX DRAWINGS DOWN DOUBLE AND RIGHT SINGLE */
02642     { 0x2554, "SF390000" }, /* BOX DRAWINGS DOUBLE DOWN AND RIGHT */
02643     { 0x2555, "SF220000" }, /* BOX DRAWINGS DOWN SINGLE AND LEFT DOUBLE */
02644     { 0x2556, "SF210000" }, /* BOX DRAWINGS DOWN DOUBLE AND LEFT SINGLE */
02645     { 0x2557, "SF250000" }, /* BOX DRAWINGS DOUBLE DOWN AND LEFT */
02646     { 0x2558, "SF500000" }, /* BOX DRAWINGS UP SINGLE AND RIGHT DOUBLE */
02647     { 0x2559, "SF490000" }, /* BOX DRAWINGS UP DOUBLE AND RIGHT SINGLE */
02648     { 0x255A, "SF380000" }, /* BOX DRAWINGS DOUBLE UP AND RIGHT */
02649     { 0x255B, "SF280000" }, /* BOX DRAWINGS UP SINGLE AND LEFT DOUBLE */
02650     { 0x255C, "SF270000" }, /* BOX DRAWINGS UP DOUBLE AND LEFT SINGLE */
02651     { 0x255D, "SF260000" }, /* BOX DRAWINGS DOUBLE UP AND LEFT */
02652     { 0x255E, "SF360000" }, /* BOX DRAWINGS VERTICAL SINGLE AND RIGHT DOUBLE */
02653     { 0x255F, "SF370000" }, /* BOX DRAWINGS VERTICAL DOUBLE AND RIGHT SINGLE */
02654     { 0x2560, "SF420000" }, /* BOX DRAWINGS DOUBLE VERTICAL AND RIGHT */
02655     { 0x2561, "SF190000" }, /* BOX DRAWINGS VERTICAL SINGLE AND LEFT DOUBLE */
02656     { 0x2562, "SF200000" }, /* BOX DRAWINGS VERTICAL DOUBLE AND LEFT SINGLE */
02657     { 0x2563, "SF230000" }, /* BOX DRAWINGS DOUBLE VERTICAL AND LEFT */
02658     { 0x2564, "SF470000" }, /* BOX DRAWINGS DOWN SINGLE AND HORIZONTAL DOUBLE */
02659     { 0x2565, "SF480000" }, /* BOX DRAWINGS DOWN DOUBLE AND HORIZONTAL SINGLE */
02660     { 0x2566, "SF410000" }, /* BOX DRAWINGS DOUBLE DOWN AND HORIZONTAL */
02661     { 0x2567, "SF450000" }, /* BOX DRAWINGS UP SINGLE AND HORIZONTAL DOUBLE */
02662     { 0x2568, "SF460000" }, /* BOX DRAWINGS UP DOUBLE AND HORIZONTAL SINGLE */
02663     { 0x2569, "SF400000" }, /* BOX DRAWINGS DOUBLE UP AND HORIZONTAL */
02664     { 0x256A, "SF540000" }, /* BOX DRAWINGS VERTICAL SINGLE AND HORIZONTAL DOUBLE */
02665     { 0x256B, "SF530000" }, /* BOX DRAWINGS VERTICAL DOUBLE AND HORIZONTAL SINGLE */
02666     { 0x256C, "SF440000" }, /* BOX DRAWINGS DOUBLE VERTICAL AND HORIZONTAL */
02667     { 0x2580, "upblock" }, /* UPPER HALF BLOCK */
02668     { 0x2584, "dnblock" }, /* LOWER HALF BLOCK */
02669     { 0x2588, "block" }, /* FULL BLOCK */
02670     { 0x258C, "lfblock" }, /* LEFT HALF BLOCK */
02671     { 0x2590, "rtblock" }, /* RIGHT HALF BLOCK */
02672     { 0x2591, "ltshade" }, /* LIGHT SHADE */
02673     { 0x2592, "shade" }, /* MEDIUM SHADE */
02674     { 0x2593, "dkshade" }, /* DARK SHADE */
02675     { 0x25A0, "filledbox" }, /* BLACK SQUARE */
02676     { 0x25A1, "H22073" }, /* WHITE SQUARE */
02677     { 0x25AA, "H18543" }, /* BLACK SMALL SQUARE */
02678     { 0x25AB, "H18551" }, /* WHITE SMALL SQUARE */
02679     { 0x25AC, "filledrect" }, /* BLACK RECTANGLE */
02680     { 0x25B2, "triagup" }, /* BLACK UP-POINTING TRIANGLE */
02681     { 0x25B3, "$triagwhiteup" }, /* WHITE UP-POINTING TRIANGLE */
02682     { 0x25BA, "triagrt" }, /* BLACK RIGHT-POINTING POINTER */
02683     { 0x25BC, "triagdn" }, /* BLACK DOWN-POINTING TRIANGLE */
02684     { 0x25BD, "$triagwhitedn" }, /* WHITE DOWN-POINTING TRIANGLE */
02685     { 0x25C4, "triaglf" }, /* BLACK LEFT-POINTING POINTER */
02686     { 0x25CA, "lozenge" }, /* LOZENGE */
02687     { 0x25CB, "circle" }, /* WHITE CIRCLE */
02688     { 0x25CF, "H18533" }, /* BLACK CIRCLE */
02689     { 0x25D8, "invbullet" }, /* INVERSE BULLET */
02690     { 0x25D9, "invcircle" }, /* INVERSE WHITE CIRCLE */
02691     { 0x25E6, "openbullet" }, /* WHITE BULLET */
02692     { 0x25EF, "$circlelarge" }, /* LARGE CIRCLE */
02693     { 0x263A, "smileface" }, /* WHITE SMILING FACE */
02694     { 0x263B, "invsmileface" }, /* BLACK SMILING FACE */
02695     { 0x263C, "sun" }, /* WHITE SUN WITH RAYS */
02696     { 0x2640, "female" }, /* FEMALE SIGN */
02697     { 0x2642, "male" }, /* MALE SIGN */
02698     { 0x2660, "spade" }, /* BLACK SPADE SUIT */
02699     { 0x2663, "club" }, /* BLACK CLUB SUIT */
02700     { 0x2665, "heart" }, /* BLACK HEART SUIT */
02701     { 0x2666, "diamond" }, /* BLACK DIAMOND SUIT */
02702     { 0x266A, "musicalnote" }, /* EIGHTH NOTE */
02703     { 0x266B, "musicalnotedbl" }, /* BEAMED EIGHTH NOTES */
02704     { 0x266D, "$flat" }, /* MUSIC FLAT SIGN */
02705     { 0x266E, "$natural" }, /* MUSIC NATURAL SIGN */
02706     { 0x266F, "$sharp" }, /* MUSIC SHARP SIGN */
02707     { 0xF6BE, "dotlessj" }, /* LATIN SMALL LETTER DOTLESS J */
02708     { 0xF6BF, "LL" }, /* LATIN CAPITAL LETTER LL */
02709     { 0xF6C0, "ll" }, /* LATIN SMALL LETTER LL */
02710     { 0xF6C3, "commaaccent" }, /* COMMA BELOW */
02711     { 0xF6C4, "afii10063" }, /* CYRILLIC SMALL LETTER GHE VARIANT */
02712     { 0xF6C5, "afii10064" }, /* CYRILLIC SMALL LETTER BE VARIANT */
02713     { 0xF6C6, "afii10192" }, /* CYRILLIC SMALL LETTER DE VARIANT */
02714     { 0xF6C7, "afii10831" }, /* CYRILLIC SMALL LETTER PE VARIANT */
02715     { 0xF6C8, "afii10832" }, /* CYRILLIC SMALL LETTER TE VARIANT */
02716     { 0xF6C9, "Acute" }, /* CAPITAL ACUTE ACCENT */
02717     { 0xF6CA, "Caron" }, /* CAPITAL CARON */
02718     { 0xF6CB, "Dieresis" }, /* CAPITAL DIAERESIS */
02719     { 0xF6CC, "DieresisAcute" }, /* CAPITAL DIAERESIS ACUTE ACCENT */
02720     { 0xF6CD, "DieresisGrave" }, /* CAPITAL DIAERESIS GRAVE ACCENT */
02721     { 0xF6CE, "Grave" }, /* CAPITAL GRAVE ACCENT */
02722     { 0xF6CF, "Hungarumlaut" }, /* CAPITAL DOUBLE ACUTE ACCENT */
02723     { 0xF6D0, "Macron" }, /* CAPITAL MACRON */
02724     { 0xF6D1, "cyrBreve" }, /* CAPITAL CYRILLIC BREVE */
02725     { 0xF6D2, "cyrFlex" }, /* CAPITAL CYRILLIC CIRCUMFLEX */
02726     { 0xF6D3, "dblGrave" }, /* CAPITAL DOUBLE GRAVE ACCENT */
02727     { 0xF6D4, "cyrbreve" }, /* CYRILLIC BREVE */
02728     { 0xF6D5, "cyrflex" }, /* CYRILLIC CIRCUMFLEX */
02729     { 0xF6D6, "dblgrave" }, /* DOUBLE GRAVE ACCENT */
02730     { 0xF6D7, "dieresisacute" }, /* DIAERESIS ACUTE ACCENT */
02731     { 0xF6D8, "dieresisgrave" }, /* DIAERESIS GRAVE ACCENT */
02732     { 0xF6D9, "copyrightserif" }, /* COPYRIGHT SIGN SERIF */
02733     { 0xF6DA, "registerserif" }, /* REGISTERED SIGN SERIF */
02734     { 0xF6DB, "trademarkserif" }, /* TRADE MARK SIGN SERIF */
02735     { 0xF6DC, "onefitted" }, /* PROPORTIONAL DIGIT ONE */
02736     { 0xF6DD, "rupiah" }, /* RUPIAH SIGN */
02737     { 0xF6DE, "threequartersemdash" }, /* THREE QUARTERS EM DASH */
02738     { 0xF6DF, "centinferior" }, /* SUBSCRIPT CENT SIGN */
02739     { 0xF6E0, "centsuperior" }, /* SUPERSCRIPT CENT SIGN */
02740     { 0xF6E1, "commainferior" }, /* SUBSCRIPT COMMA */
02741     { 0xF6E2, "commasuperior" }, /* SUPERSCRIPT COMMA */
02742     { 0xF6E3, "dollarinferior" }, /* SUBSCRIPT DOLLAR SIGN */
02743     { 0xF6E4, "dollarsuperior" }, /* SUPERSCRIPT DOLLAR SIGN */
02744     { 0xF6E5, "hypheninferior" }, /* SUBSCRIPT HYPHEN-MINUS */
02745     { 0xF6E6, "hyphensuperior" }, /* SUPERSCRIPT HYPHEN-MINUS */
02746     { 0xF6E7, "periodinferior" }, /* SUBSCRIPT FULL STOP */
02747     { 0xF6E8, "periodsuperior" }, /* SUPERSCRIPT FULL STOP */
02748     { 0xF6E9, "asuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER A */
02749     { 0xF6EA, "bsuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER B */
02750     { 0xF6EB, "dsuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER D */
02751     { 0xF6EC, "esuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER E */
02752     { 0xF6ED, "isuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER I */
02753     { 0xF6EE, "lsuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER L */
02754     { 0xF6EF, "msuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER M */
02755     { 0xF6F0, "osuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER O */
02756     { 0xF6F1, "rsuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER R */
02757     { 0xF6F2, "ssuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER S */
02758     { 0xF6F3, "tsuperior" }, /* SUPERSCRIPT LATIN SMALL LETTER T */
02759     { 0xF6F4, "Brevesmall" }, /* SMALL CAPITAL BREVE */
02760     { 0xF6F5, "Caronsmall" }, /* SMALL CAPITAL CARON */
02761     { 0xF6F6, "Circumflexsmall" }, /* SMALL CAPITAL MODIFIER LETTER CIRCUMFLEX ACCENT */
02762     { 0xF6F7, "Dotaccentsmall" }, /* SMALL CAPITAL DOT ABOVE */
02763     { 0xF6F8, "Hungarumlautsmall" }, /* SMALL CAPITAL DOUBLE ACUTE ACCENT */
02764     { 0xF6F9, "Lslashsmall" }, /* LATIN SMALL CAPITAL LETTER L WITH STROKE */
02765     { 0xF6FA, "OEsmall" }, /* LATIN SMALL CAPITAL LIGATURE OE */
02766     { 0xF6FB, "Ogoneksmall" }, /* SMALL CAPITAL OGONEK */
02767     { 0xF6FC, "Ringsmall" }, /* SMALL CAPITAL RING ABOVE */
02768     { 0xF6FD, "Scaronsmall" }, /* LATIN SMALL CAPITAL LETTER S WITH CARON */
02769     { 0xF6FE, "Tildesmall" }, /* SMALL CAPITAL SMALL TILDE */
02770     { 0xF6FF, "Zcaronsmall" }, /* LATIN SMALL CAPITAL LETTER Z WITH CARON */
02771     { 0xF721, "exclamsmall" }, /* SMALL CAPITAL EXCLAMATION MARK */
02772     { 0xF724, "dollaroldstyle" }, /* OLDSTYLE DOLLAR SIGN */
02773     { 0xF726, "ampersandsmall" }, /* SMALL CAPITAL AMPERSAND */
02774     { 0xF730, "zerooldstyle" }, /* OLDSTYLE DIGIT ZERO */
02775     { 0xF731, "oneoldstyle" }, /* OLDSTYLE DIGIT ONE */
02776     { 0xF732, "twooldstyle" }, /* OLDSTYLE DIGIT TWO */
02777     { 0xF733, "threeoldstyle" }, /* OLDSTYLE DIGIT THREE */
02778     { 0xF734, "fouroldstyle" }, /* OLDSTYLE DIGIT FOUR */
02779     { 0xF735, "fiveoldstyle" }, /* OLDSTYLE DIGIT FIVE */
02780     { 0xF736, "sixoldstyle" }, /* OLDSTYLE DIGIT SIX */
02781     { 0xF737, "sevenoldstyle" }, /* OLDSTYLE DIGIT SEVEN */
02782     { 0xF738, "eightoldstyle" }, /* OLDSTYLE DIGIT EIGHT */
02783     { 0xF739, "nineoldstyle" }, /* OLDSTYLE DIGIT NINE */
02784     { 0xF73F, "questionsmall" }, /* SMALL CAPITAL QUESTION MARK */
02785     { 0xF760, "Gravesmall" }, /* SMALL CAPITAL GRAVE ACCENT */
02786     { 0xF761, "Asmall" }, /* LATIN SMALL CAPITAL LETTER A */
02787     { 0xF762, "Bsmall" }, /* LATIN SMALL CAPITAL LETTER B */
02788     { 0xF763, "Csmall" }, /* LATIN SMALL CAPITAL LETTER C */
02789     { 0xF764, "Dsmall" }, /* LATIN SMALL CAPITAL LETTER D */
02790     { 0xF765, "Esmall" }, /* LATIN SMALL CAPITAL LETTER E */
02791     { 0xF766, "Fsmall" }, /* LATIN SMALL CAPITAL LETTER F */
02792     { 0xF767, "Gsmall" }, /* LATIN SMALL CAPITAL LETTER G */
02793     { 0xF768, "Hsmall" }, /* LATIN SMALL CAPITAL LETTER H */
02794     { 0xF769, "Ismall" }, /* LATIN SMALL CAPITAL LETTER I */
02795     { 0xF76A, "Jsmall" }, /* LATIN SMALL CAPITAL LETTER J */
02796     { 0xF76B, "Ksmall" }, /* LATIN SMALL CAPITAL LETTER K */
02797     { 0xF76C, "Lsmall" }, /* LATIN SMALL CAPITAL LETTER L */
02798     { 0xF76D, "Msmall" }, /* LATIN SMALL CAPITAL LETTER M */
02799     { 0xF76E, "Nsmall" }, /* LATIN SMALL CAPITAL LETTER N */
02800     { 0xF76F, "Osmall" }, /* LATIN SMALL CAPITAL LETTER O */
02801     { 0xF770, "Psmall" }, /* LATIN SMALL CAPITAL LETTER P */
02802     { 0xF771, "Qsmall" }, /* LATIN SMALL CAPITAL LETTER Q */
02803     { 0xF772, "Rsmall" }, /* LATIN SMALL CAPITAL LETTER R */
02804     { 0xF773, "Ssmall" }, /* LATIN SMALL CAPITAL LETTER S */
02805     { 0xF774, "Tsmall" }, /* LATIN SMALL CAPITAL LETTER T */
02806     { 0xF775, "Usmall" }, /* LATIN SMALL CAPITAL LETTER U */
02807     { 0xF776, "Vsmall" }, /* LATIN SMALL CAPITAL LETTER V */
02808     { 0xF777, "Wsmall" }, /* LATIN SMALL CAPITAL LETTER W */
02809     { 0xF778, "Xsmall" }, /* LATIN SMALL CAPITAL LETTER X */
02810     { 0xF779, "Ysmall" }, /* LATIN SMALL CAPITAL LETTER Y */
02811     { 0xF77A, "Zsmall" }, /* LATIN SMALL CAPITAL LETTER Z */
02812     { 0xF7A1, "exclamdownsmall" }, /* SMALL CAPITAL INVERTED EXCLAMATION MARK */
02813     { 0xF7A2, "centoldstyle" }, /* OLDSTYLE CENT SIGN */
02814     { 0xF7A8, "Dieresissmall" }, /* SMALL CAPITAL DIAERESIS */
02815     { 0xF7AF, "Macronsmall" }, /* SMALL CAPITAL MACRON */
02816     { 0xF7B4, "Acutesmall" }, /* SMALL CAPITAL ACUTE ACCENT */
02817     { 0xF7B8, "Cedillasmall" }, /* SMALL CAPITAL CEDILLA */
02818     { 0xF7BF, "questiondownsmall" }, /* SMALL CAPITAL INVERTED QUESTION MARK */
02819     { 0xF7E0, "Agravesmall" }, /* LATIN SMALL CAPITAL LETTER A WITH GRAVE */
02820     { 0xF7E1, "Aacutesmall" }, /* LATIN SMALL CAPITAL LETTER A WITH ACUTE */
02821     { 0xF7E2, "Acircumflexsmall" }, /* LATIN SMALL CAPITAL LETTER A WITH CIRCUMFLEX */
02822     { 0xF7E3, "Atildesmall" }, /* LATIN SMALL CAPITAL LETTER A WITH TILDE */
02823     { 0xF7E4, "Adieresissmall" }, /* LATIN SMALL CAPITAL LETTER A WITH DIAERESIS */
02824     { 0xF7E5, "Aringsmall" }, /* LATIN SMALL CAPITAL LETTER A WITH RING ABOVE */
02825     { 0xF7E6, "AEsmall" }, /* LATIN SMALL CAPITAL LETTER AE */
02826     { 0xF7E7, "Ccedillasmall" }, /* LATIN SMALL CAPITAL LETTER C WITH CEDILLA */
02827     { 0xF7E8, "Egravesmall" }, /* LATIN SMALL CAPITAL LETTER E WITH GRAVE */
02828     { 0xF7E9, "Eacutesmall" }, /* LATIN SMALL CAPITAL LETTER E WITH ACUTE */
02829     { 0xF7EA, "Ecircumflexsmall" }, /* LATIN SMALL CAPITAL LETTER E WITH CIRCUMFLEX */
02830     { 0xF7EB, "Edieresissmall" }, /* LATIN SMALL CAPITAL LETTER E WITH DIAERESIS */
02831     { 0xF7EC, "Igravesmall" }, /* LATIN SMALL CAPITAL LETTER I WITH GRAVE */
02832     { 0xF7ED, "Iacutesmall" }, /* LATIN SMALL CAPITAL LETTER I WITH ACUTE */
02833     { 0xF7EE, "Icircumflexsmall" }, /* LATIN SMALL CAPITAL LETTER I WITH CIRCUMFLEX */
02834     { 0xF7EF, "Idieresissmall" }, /* LATIN SMALL CAPITAL LETTER I WITH DIAERESIS */
02835     { 0xF7F0, "Ethsmall" }, /* LATIN SMALL CAPITAL LETTER ETH */
02836     { 0xF7F1, "Ntildesmall" }, /* LATIN SMALL CAPITAL LETTER N WITH TILDE */
02837     { 0xF7F2, "Ogravesmall" }, /* LATIN SMALL CAPITAL LETTER O WITH GRAVE */
02838     { 0xF7F3, "Oacutesmall" }, /* LATIN SMALL CAPITAL LETTER O WITH ACUTE */
02839     { 0xF7F4, "Ocircumflexsmall" }, /* LATIN SMALL CAPITAL LETTER O WITH CIRCUMFLEX */
02840     { 0xF7F5, "Otildesmall" }, /* LATIN SMALL CAPITAL LETTER O WITH TILDE */
02841     { 0xF7F6, "Odieresissmall" }, /* LATIN SMALL CAPITAL LETTER O WITH DIAERESIS */
02842     { 0xF7F8, "Oslashsmall" }, /* LATIN SMALL CAPITAL LETTER O WITH STROKE */
02843     { 0xF7F9, "Ugravesmall" }, /* LATIN SMALL CAPITAL LETTER U WITH GRAVE */
02844     { 0xF7FA, "Uacutesmall" }, /* LATIN SMALL CAPITAL LETTER U WITH ACUTE */
02845     { 0xF7FB, "Ucircumflexsmall" }, /* LATIN SMALL CAPITAL LETTER U WITH CIRCUMFLEX */
02846     { 0xF7FC, "Udieresissmall" }, /* LATIN SMALL CAPITAL LETTER U WITH DIAERESIS */
02847     { 0xF7FD, "Yacutesmall" }, /* LATIN SMALL CAPITAL LETTER Y WITH ACUTE */
02848     { 0xF7FE, "Thornsmall" }, /* LATIN SMALL CAPITAL LETTER THORN */
02849     { 0xF7FF, "Ydieresissmall" }, /* LATIN SMALL CAPITAL LETTER Y WITH DIAERESIS */
02850     { 0xF8E5, "radicalex" }, /* RADICAL EXTENDER */
02851     { 0xF8E6, "arrowvertex" }, /* VERTICAL ARROW EXTENDER */
02852     { 0xF8E7, "arrowhorizex" }, /* HORIZONTAL ARROW EXTENDER */
02853     { 0xF8E8, "registersans" }, /* REGISTERED SIGN SANS SERIF */
02854     { 0xF8E9, "copyrightsans" }, /* COPYRIGHT SIGN SANS SERIF */
02855     { 0xF8EA, "trademarksans" }, /* TRADE MARK SIGN SANS SERIF */
02856     { 0xF8EB, "parenlefttp" }, /* LEFT PAREN TOP */
02857     { 0xF8EC, "parenleftex" }, /* LEFT PAREN EXTENDER */
02858     { 0xF8ED, "parenleftbt" }, /* LEFT PAREN BOTTOM */
02859     { 0xF8EE, "bracketlefttp" }, /* LEFT SQUARE BRACKET TOP */
02860     { 0xF8EF, "bracketleftex" }, /* LEFT SQUARE BRACKET EXTENDER */
02861     { 0xF8F0, "bracketleftbt" }, /* LEFT SQUARE BRACKET BOTTOM */
02862     { 0xF8F1, "bracelefttp" }, /* LEFT CURLY BRACKET TOP */
02863     { 0xF8F2, "braceleftmid" }, /* LEFT CURLY BRACKET MID */
02864     { 0xF8F3, "braceleftbt" }, /* LEFT CURLY BRACKET BOTTOM */
02865     { 0xF8F4, "braceex" }, /* CURLY BRACKET EXTENDER */
02866     { 0xF8F5, "integralex" }, /* INTEGRAL EXTENDER */
02867     { 0xF8F6, "parenrighttp" }, /* RIGHT PAREN TOP */
02868     { 0xF8F7, "parenrightex" }, /* RIGHT PAREN EXTENDER */
02869     { 0xF8F8, "parenrightbt" }, /* RIGHT PAREN BOTTOM */
02870     { 0xF8F9, "bracketrighttp" }, /* RIGHT SQUARE BRACKET TOP */
02871     { 0xF8FA, "bracketrightex" }, /* RIGHT SQUARE BRACKET EXTENDER */
02872     { 0xF8FB, "bracketrightbt" }, /* RIGHT SQUARE BRACKET BOTTOM */
02873     { 0xF8FC, "bracerighttp" }, /* RIGHT CURLY BRACKET TOP */
02874     { 0xF8FD, "bracerightmid" }, /* RIGHT CURLY BRACKET MID */
02875     { 0xF8FE, "bracerightbt" }, /* RIGHT CURLY BRACKET BOTTOM */
02876     { 0xFB00, "ff" }, /* LATIN SMALL LIGATURE FF */
02877     { 0xFB01, "fi" }, /* LATIN SMALL LIGATURE FI */
02878     { 0xFB02, "fl" }, /* LATIN SMALL LIGATURE FL */
02879     { 0xFB03, "ffi" }, /* LATIN SMALL LIGATURE FFI */
02880     { 0xFB04, "ffl" }, /* LATIN SMALL LIGATURE FFL */
02881     { 0xFB05, "$longst" }, /* LATIN SMALL LIGATURE LONG S T */
02882     { 0xFB06, "$st" }, /* LATIN SMALL LIGATURE ST */
02883     { 0xFB1F, "afii57705" }, /* HEBREW LIGATURE YIDDISH YOD YOD PATAH */
02884     { 0xFB2A, "afii57694" }, /* HEBREW LETTER SHIN WITH SHIN DOT */
02885     { 0xFB2B, "afii57695" }, /* HEBREW LETTER SHIN WITH SIN DOT */
02886     { 0xFB35, "afii57723" }, /* HEBREW LETTER VAV WITH DAGESH */
02887     { 0xFB4B, "afii57700" } /* HEBREW LETTER VAV WITH HOLAM */
02888 };
02889 #endif /* 0 */
02890 
02891 static int
02892 adobe_name_cmp(const void *s1, const void *s2)
02893 {
02894     const struct adobe2unicode *a = s1;
02895     const struct adobe2unicode *b = s2;
02896     
02897     return strcmp(a->adobe_name, b->adobe_name);
02898 }
02899 
02900 #if 0
02901 static int
02902 unicode_id_cmp(const void *s1, const void *s2)
02903 {
02904     const struct unicode2adobe *a = s1;
02905     const struct unicode2adobe *b = s2;
02906 
02907     return a->unicode - b->unicode;
02908 }
02909 #endif /* 0 */
02910 
02911 void
02912 close_iconv(void)
02913 {
02914 #if HAVE_ICONV_H
02915     if (m_iconv_gb_ucs4 != (iconv_t)(-1)) {
02916        iconv_close(m_iconv_gb_ucs4);
02917        m_iconv_gb_ucs4 = (iconv_t)(-1);
02918     }
02919 #endif /* HAVE_ICONV_H */
02920 }
02921 
02922 #if HAVE_ICONV_H
02923 /* convert a CJK char to unicode (UCS-4) using iconv() */
02924 static uint32_t
02925 cjk2unicode(const unsigned char *cjk)
02926 {
02927     uint32_t u = 0;
02928     unsigned char unicode[4];
02929     size_t from = 2;
02930     size_t to = sizeof unicode;
02931     static Boolean initialized = False;
02932     char *from_ptr = (char *)cjk;
02933     char *to_ptr = (char *)unicode;
02934     
02935     if (m_iconv_gb_ucs4 == (iconv_t)(-1)) {
02936        if (initialized)
02937            return 0;
02938        initialized = True;
02939        m_iconv_gb_ucs4 = iconv_open(
02940 #ifdef WORDS_BIGENDIAN
02941                                  "UCS-4BE",
02942 #else
02943                                  "UCS-4LE",
02944 #endif
02945                                  "GB18030");
02946        if (m_iconv_gb_ucs4 == (iconv_t)(-1)) {
02947            XDVI_ERROR((stderr, "cjk2unicode: iconv_open() failed: %s", strerror(errno)));
02948            return 0;
02949        }
02950     }
02951     if (iconv(m_iconv_gb_ucs4, (iconv_char_pptrT)&from_ptr, &from, &to_ptr, &to) == (size_t)(-1)) {
02952        XDVI_ERROR((stderr, "cjk2unicode: can't convert GBK to unicode: %s", strerror(errno)));
02953        return 0;
02954     }
02955     memcpy(&u, unicode, sizeof unicode);
02956     return u;
02957 }
02958 #endif /* HAVE_ICONV_H */
02959 
02960 /*
02961  * Return the unicode ID of adobe_name, or 0 if it isn't found.
02962  * Uses the lookup table adobe2unicode_table, or iconv for CJK fonts.
02963  */
02964 uint32_t
02965 adobe2unicode_name(const char *adobe_name)
02966 {
02967     struct adobe2unicode search_item;
02968     struct adobe2unicode *match_item;
02969 
02970     if (memcmp(adobe_name, "cjk", 3) == 0) {
02971 #if HAVE_ICONV_H
02972        /* Special case for CJK fonts (Chinese) - ZLB: the Adobe names in
02973         * the Chinese T1 fonts are of the form 'cjkXXXX' where 'XXXX' are
02974         * the hex number of the GBK/GB18030 encoding */
02975        unsigned char cjk[2], xx[3];
02976        xx[0] = adobe_name[3];
02977        xx[1] = adobe_name[4];
02978        xx[2] = '\0';
02979        cjk[0] = strtoul((char *)xx, NULL, 16);
02980        xx[0] = adobe_name[5];
02981        xx[1] = adobe_name[6];
02982        cjk[1] = strtoul((char *)xx, NULL, 16);
02983        /* convert GBK ==> unicode */
02984        return cjk2unicode(cjk);
02985 #else /* HAVE_ICONV_H */
02986        if (!warned_about_cjk) {
02987            popup_message(globals.widgets.top_level,
02988                        MSG_WARN, NULL, "This version of xdvi has been compiled without iconv support - "
02989                        "cannot convert CJK character to UTF-8");
02990            warned_about_cjk = True;
02991        }
02992        return 0;
02993 #endif /* HAVE_ICONV_H */
02994     }
02995     else {
02996        search_item.adobe_name = adobe_name;
02997     
02998        match_item = bsearch(&search_item, adobe2unicode_table,
02999                           sizeof adobe2unicode_table / sizeof adobe2unicode_table[0],
03000                           sizeof adobe2unicode_table[0],
03001                           adobe_name_cmp);
03002        if (match_item != NULL)
03003            return match_item->unicode;
03004        else
03005            return 0;
03006     }
03007 }
03008 
03009 #if 0
03010 /*
03011  * Return the adobe_name of unicode ID, or NULL if it isn't found.
03012  * Uses the lookup table unicode2adobe_table.
03013  */
03014 const char *
03015 unicode2adobe_name(uint32_t unicode)
03016 {
03017     struct unicode2adobe search_item;
03018     struct unicode2adobe *match_item;
03019     
03020     search_item.unicode = unicode;
03021     
03022     match_item = bsearch(&search_item, unicode2adobe_table,
03023                       sizeof unicode2adobe_table / sizeof unicode2adobe_table[0],
03024                       sizeof unicode2adobe_table[0],
03025                       unicode_id_cmp);
03026     if (match_item != NULL)
03027        return match_item->adobe_name;
03028     else
03029        return NULL;
03030 }
03031 #endif /* 0 */
03032 
03033 
03034 static uint32_t
03035 ucs4_lowercase(uint32_t c)
03036 {
03037     /*
03038       This table was produced by:
03039       
03040       cat uni2adobe | while read a b; do lc_b=`echo $b | tr 'A-Z' 'a-z'`; \
03041       if [ "$lc_b" != "$b" ] ; then res=`egrep " $lc_b\$" uni2adobe` ; \
03042       if [ -n "$res" ]; then echo "RES: $a $b -> $res"; fi; fi; done | grep 'RES' > uni2adobe-map
03043 
03044       And then, some Emacs keyboard macros.
03045      */
03046     switch (c) {
03047     case 0x0041: /* A */                return 0x0061; /* a */
03048     case 0x0042: /* B */                return 0x0062; /* b */
03049     case 0x0043: /* C */                return 0x0063; /* c */
03050     case 0x0044: /* D */                return 0x0064; /* d */
03051     case 0x0045: /* E */                return 0x0065; /* e */
03052     case 0x0046: /* F */                return 0x0066; /* f */
03053     case 0x0047: /* G */                return 0x0067; /* g */
03054     case 0x0048: /* H */                return 0x0068; /* h */
03055     case 0x0049: /* I */                return 0x0069; /* i */
03056     case 0x004A: /* J */                return 0x006A; /* j */
03057     case 0x004B: /* K */                return 0x006B; /* k */
03058     case 0x004C: /* L */                return 0x006C; /* l */
03059     case 0x004D: /* M */                return 0x006D; /* m */
03060     case 0x004E: /* N */                return 0x006E; /* n */
03061     case 0x004F: /* O */                return 0x006F; /* o */
03062     case 0x0050: /* P */                return 0x0070; /* p */
03063     case 0x0051: /* Q */                return 0x0071; /* q */
03064     case 0x0052: /* R */                return 0x0072; /* r */
03065     case 0x0053: /* S */                return 0x0073; /* s */
03066     case 0x0054: /* T */                return 0x0074; /* t */
03067     case 0x0055: /* U */                return 0x0075; /* u */
03068     case 0x0056: /* V */                return 0x0076; /* v */
03069     case 0x0057: /* W */                return 0x0077; /* w */
03070     case 0x0058: /* X */                return 0x0078; /* x */
03071     case 0x0059: /* Y */                return 0x0079; /* y */
03072     case 0x005A: /* Z */                return 0x007A; /* z */
03073     case 0x00C0: /* Agrave */           return 0x00E0; /* agrave */
03074     case 0x00C1: /* Aacute */           return 0x00E1; /* aacute */
03075     case 0x00C2: /* Acircumflex */      return 0x00E2; /* acircumflex */
03076     case 0x00C3: /* Atilde */           return 0x00E3; /* atilde */
03077     case 0x00C4: /* Adieresis */        return 0x00E4; /* adieresis */
03078     case 0x00C5: /* Aring */            return 0x00E5; /* aring */
03079     case 0x00C6: /* AE */               return 0x00E6; /* ae */
03080     case 0x00C7: /* Ccedilla */         return 0x00E7; /* ccedilla */
03081     case 0x00C8: /* Egrave */           return 0x00E8; /* egrave */
03082     case 0x00C9: /* Eacute */           return 0x00E9; /* eacute */
03083     case 0x00CA: /* Ecircumflex */      return 0x00EA; /* ecircumflex */
03084     case 0x00CB: /* Edieresis */        return 0x00EB; /* edieresis */
03085     case 0x00CC: /* Igrave */           return 0x00EC; /* igrave */
03086     case 0x00CD: /* Iacute */           return 0x00ED; /* iacute */
03087     case 0x00CE: /* Icircumflex */      return 0x00EE; /* icircumflex */
03088     case 0x00CF: /* Idieresis */        return 0x00EF; /* idieresis */
03089     case 0x00D0: /* Eth */              return 0x00F0; /* eth */
03090     case 0x00D1: /* Ntilde */           return 0x00F1; /* ntilde */
03091     case 0x00D2: /* Ograve */           return 0x00F2; /* ograve */
03092     case 0x00D3: /* Oacute */           return 0x00F3; /* oacute */
03093     case 0x00D4: /* Ocircumflex */      return 0x00F4; /* ocircumflex */
03094     case 0x00D5: /* Otilde */           return 0x00F5; /* otilde */
03095     case 0x00D6: /* Odieresis */        return 0x00F6; /* odieresis */
03096     case 0x00D8: /* Oslash */           return 0x00F8; /* oslash */
03097     case 0x00D9: /* Ugrave */           return 0x00F9; /* ugrave */
03098     case 0x00DA: /* Uacute */           return 0x00FA; /* uacute */
03099     case 0x00DB: /* Ucircumflex */      return 0x00FB; /* ucircumflex */
03100     case 0x00DC: /* Udieresis */        return 0x00FC; /* udieresis */
03101     case 0x00DD: /* Yacute */           return 0x00FD; /* yacute */
03102     case 0x00DE: /* Thorn */            return 0x00FE; /* thorn */
03103     case 0x0100: /* Amacron */          return 0x0101; /* amacron */
03104     case 0x0102: /* Abreve */           return 0x0103; /* abreve */
03105     case 0x0104: /* Aogonek */          return 0x0105; /* aogonek */
03106     case 0x0106: /* Cacute */           return 0x0107; /* cacute */
03107     case 0x0108: /* Ccircumflex */      return 0x0109; /* ccircumflex */
03108     case 0x010A: /* Cdotaccent */       return 0x010B; /* cdotaccent */
03109     case 0x010C: /* Ccaron */           return 0x010D; /* ccaron */
03110     case 0x010E: /* Dcaron */           return 0x010F; /* dcaron */
03111     case 0x0110: /* Dcroat */           return 0x0111; /* dcroat */
03112     case 0x0112: /* Emacron */          return 0x0113; /* emacron */
03113     case 0x0114: /* Ebreve */           return 0x0115; /* ebreve */
03114     case 0x0116: /* Edotaccent */       return 0x0117; /* edotaccent */
03115     case 0x0118: /* Eogonek */          return 0x0119; /* eogonek */
03116     case 0x011A: /* Ecaron */           return 0x011B; /* ecaron */
03117     case 0x011C: /* Gcircumflex */      return 0x011D; /* gcircumflex */
03118     case 0x011E: /* Gbreve */           return 0x011F; /* gbreve */
03119     case 0x0120: /* Gdotaccent */       return 0x0121; /* gdotaccent */
03120     case 0x0122: /* Gcommaaccent */     return 0x0123; /* gcommaaccent */
03121     case 0x0124: /* Hcircumflex */      return 0x0125; /* hcircumflex */
03122     case 0x0126: /* Hbar */             return 0x0127; /* hbar */
03123     case 0x0128: /* Itilde */           return 0x0129; /* itilde */
03124     case 0x012A: /* Imacron */          return 0x012B; /* imacron */
03125     case 0x012C: /* Ibreve */           return 0x012D; /* ibreve */
03126     case 0x012E: /* Iogonek */          return 0x012F; /* iogonek */
03127     case 0x0132: /* IJ */               return 0x0133; /* ij */
03128     case 0x0134: /* Jcircumflex */      return 0x0135; /* jcircumflex */
03129     case 0x0136: /* Kcommaaccent */     return 0x0137; /* kcommaaccent */
03130     case 0x0139: /* Lacute */           return 0x013A; /* lacute */
03131     case 0x013B: /* Lcommaaccent */     return 0x013C; /* lcommaaccent */
03132     case 0x013D: /* Lcaron */           return 0x013E; /* lcaron */
03133     case 0x013F: /* Ldot */             return 0x0140; /* ldot */
03134     case 0x0141: /* Lslash */           return 0x0142; /* lslash */
03135     case 0x0143: /* Nacute */           return 0x0144; /* nacute */
03136     case 0x0145: /* Ncommaaccent */     return 0x0146; /* ncommaaccent */
03137     case 0x0147: /* Ncaron */           return 0x0148; /* ncaron */
03138     case 0x014A: /* Eng */              return 0x014B; /* eng */
03139     case 0x014C: /* Omacron */          return 0x014D; /* omacron */
03140     case 0x014E: /* Obreve */           return 0x014F; /* obreve */
03141     case 0x0150: /* Ohungarumlaut */    return 0x0151; /* ohungarumlaut */
03142     case 0x0152: /* OE */               return 0x0153; /* oe */
03143     case 0x0154: /* Racute */           return 0x0155; /* racute */
03144     case 0x0156: /* Rcommaaccent */     return 0x0157; /* rcommaaccent */
03145     case 0x0158: /* Rcaron */           return 0x0159; /* rcaron */
03146     case 0x015A: /* Sacute */           return 0x015B; /* sacute */
03147     case 0x015C: /* Scircumflex */      return 0x015D; /* scircumflex */
03148     case 0x015E: /* Scedilla */         return 0x015F; /* scedilla */
03149     case 0x0160: /* Scaron */           return 0x0161; /* scaron */
03150     case 0x0162: /* Tcommaaccent */     return 0x0163; /* tcommaaccent */
03151     case 0x0164: /* Tcaron */           return 0x0165; /* tcaron */
03152     case 0x0166: /* Tbar */             return 0x0167; /* tbar */
03153     case 0x0168: /* Utilde */           return 0x0169; /* utilde */
03154     case 0x016A: /* Umacron */          return 0x016B; /* umacron */
03155     case 0x016C: /* Ubreve */           return 0x016D; /* ubreve */
03156     case 0x016E: /* Uring */            return 0x016F; /* uring */
03157     case 0x0170: /* Uhungarumlaut */    return 0x0171; /* uhungarumlaut */
03158     case 0x0172: /* Uogonek */          return 0x0173; /* uogonek */
03159     case 0x0174: /* Wcircumflex */      return 0x0175; /* wcircumflex */
03160     case 0x0176: /* Ycircumflex */      return 0x0177; /* ycircumflex */
03161     case 0x0178: /* Ydieresis */        return 0x00FF; /* ydieresis */
03162     case 0x0179: /* Zacute */           return 0x017A; /* zacute */
03163     case 0x017B: /* Zdotaccent */       return 0x017C; /* zdotaccent */
03164     case 0x017D: /* Zcaron */           return 0x017E; /* zcaron */
03165     case 0x01A0: /* Ohorn */            return 0x01A1; /* ohorn */
03166     case 0x01AF: /* Uhorn */            return 0x01B0; /* uhorn */
03167     case 0x01E6: /* Gcaron */           return 0x01E7; /* gcaron */
03168     case 0x01FA: /* Aringacute */       return 0x01FB; /* aringacute */
03169     case 0x01FC: /* AEacute */          return 0x01FD; /* aeacute */
03170     case 0x01FE: /* Oslashacute */      return 0x01FF; /* oslashacute */
03171     case 0x0218: /* Scommaaccent */     return 0x0219; /* scommaaccent */
03172     case 0x0386: /* Alphatonos */       return 0x03AC; /* alphatonos */
03173     case 0x0388: /* Epsilontonos */     return 0x03AD; /* epsilontonos */
03174     case 0x0389: /* Etatonos */         return 0x03AE; /* etatonos */
03175     case 0x038A: /* Iotatonos */        return 0x03AF; /* iotatonos */
03176     case 0x038C: /* Omicrontonos */     return 0x03CC; /* omicrontonos */
03177     case 0x038E: /* Upsilontonos */     return 0x03CD; /* upsilontonos */
03178     case 0x038F: /* Omegatonos */       return 0x03CE; /* omegatonos */
03179     case 0x0391: /* Alpha */            return 0x03B1; /* alpha */
03180     case 0x0392: /* Beta */             return 0x03B2; /* beta */
03181     case 0x0393: /* Gamma */            return 0x03B3; /* gamma */
03182     case 0x0395: /* Epsilon */          return 0x03B5; /* epsilon */
03183     case 0x0396: /* Zeta */             return 0x03B6; /* zeta */
03184     case 0x0397: /* Eta */              return 0x03B7; /* eta */
03185     case 0x0398: /* Theta */            return 0x03B8; /* theta */
03186     case 0x0399: /* Iota */             return 0x03B9; /* iota */
03187     case 0x039A: /* Kappa */            return 0x03BA; /* kappa */
03188     case 0x039B: /* Lambda */           return 0x03BB; /* lambda */
03189     case 0x039C: /* Mu */               return 0x00B5; /* mu */
03190     case 0x039D: /* Nu */               return 0x03BD; /* nu */
03191     case 0x039E: /* Xi */               return 0x03BE; /* xi */
03192     case 0x039F: /* Omicron */          return 0x03BF; /* omicron */
03193     case 0x03A0: /* Pi */               return 0x03C0; /* pi */
03194     case 0x03A1: /* Rho */              return 0x03C1; /* rho */
03195     case 0x03A3: /* Sigma */            return 0x03C3; /* sigma */
03196     case 0x03A4: /* Tau */              return 0x03C4; /* tau */
03197     case 0x03A5: /* Upsilon */          return 0x03C5; /* upsilon */
03198     case 0x03A6: /* Phi */              return 0x03C6; /* phi */
03199     case 0x03A7: /* Chi */              return 0x03C7; /* chi */
03200     case 0x03A8: /* Psi */              return 0x03C8; /* psi */
03201     case 0x03AA: /* Iotadieresis */     return 0x03CA; /* iotadieresis */
03202     case 0x03AB: /* Upsilondieresis */  return 0x03CB; /* upsilondieresis */
03203     case 0x1E80: /* Wgrave */           return 0x1E81; /* wgrave */
03204     case 0x1E82: /* Wacute */           return 0x1E83; /* wacute */
03205     case 0x1E84: /* Wdieresis */        return 0x1E85; /* wdieresis */
03206     case 0x1EF2: /* Ygrave */           return 0x1EF3; /* ygrave */
03207     case 0x2126: /* Omega */            return 0x03C9; /* omega */
03208     case 0x2206: /* Delta */            return 0x03B4; /* delta */
03209     case 0xF6BF: /* LL */               return 0xF6C0; /* ll */
03210     case 0xF6C9: /* Acute */            return 0x00B4; /* acute */
03211     case 0xF6CA: /* Caron */            return 0x02C7; /* caron */
03212     case 0xF6CB: /* Dieresis */         return 0x00A8; /* dieresis */
03213     case 0xF6CC: /* DieresisAcute */    return 0xF6D7; /* dieresisacute */
03214     case 0xF6CD: /* DieresisGrave */    return 0xF6D8; /* dieresisgrave */
03215     case 0xF6CE: /* Grave */            return 0x0060; /* grave */
03216     case 0xF6CF: /* Hungarumlaut */     return 0x02DD; /* hungarumlaut */
03217     case 0xF6D0: /* Macron */           return 0x00AF; /* macron */
03218     case 0xF6D1: /* cyrBreve */         return 0xF6D4; /* cyrbreve */
03219     case 0xF6D2: /* cyrFlex */          return 0xF6D5; /* cyrflex */
03220     case 0xF6D3: /* dblGrave */         return 0xF6D6; /* dblgrave */
03221     default: return c;
03222     }
03223 }
03224 
03225 /*
03226  * For the unicode IDs of an accent and a base_glyph, return the
03227  * unicode ID of the composed (accented) glyph. If there is no
03228  * suitable composed glyph, return 0.
03229  */
03230 uint32_t
03231 get_accented_glyph(uint32_t accent, uint32_t base_glyph)
03232 {
03233     TRACE_FIND((stderr, "get_accented_glyph: %lu, %lu",
03234               (unsigned long)accent, (unsigned long)base_glyph));
03235     switch(accent) {
03236     case 0x0060: /* grave */
03237        switch (base_glyph) {
03238        case 0x0041: /* A */ return 0x00C0;
03239        case 0x0045: /* E */ return 0x00C8;
03240        case 0x0049: /* I */ return 0x00CC;
03241        case 0x004F: /* O */ return 0x00D2;
03242        case 0x0055: /* U */ return 0x00D9;
03243        case 0x0057: /* W */ return 0x1E80;
03244        case 0x0059: /* Y */ return 0x1EF2;
03245        case 0x0061: /* a */ return 0x00E0;
03246        case 0x0065: /* e */ return 0x00E8;
03247        case 0x0069: /* i */ return 0x00EC;
03248        case 0x006F: /* o */ return 0x00F2;
03249        case 0x0075: /* u */ return 0x00F9;
03250        case 0x0077: /* w */ return 0x1E81;
03251        case 0x0079: /* y */ return 0x1EF3;
03252        default: return 0;
03253        }
03254     case 0x00B4: /* acute */
03255        switch (base_glyph) {
03256        case 0x0041: /* A */ return 0x00C1;
03257        case 0x0043: /* C */ return 0x0106;
03258        case 0x0045: /* E */ return 0x00C9;
03259        case 0x0049: /* I */ return 0x00CD;
03260        case 0x004C: /* L */ return 0x0139;
03261        case 0x004E: /* N */ return 0x0143;
03262        case 0x004F: /* O */ return 0x00D3;
03263        case 0x0052: /* R */ return 0x0154;
03264        case 0x0053: /* S */ return 0x015A;
03265        case 0x0055: /* U */ return 0x00DA;
03266        case 0x0057: /* W */ return 0x1E82;
03267        case 0x0059: /* Y */ return 0x00DD;
03268        case 0x0060: /* Z */ return 0x0179;
03269        case 0x0061: /* a */ return 0x00E1;
03270        case 0x0063: /* c */ return 0x0107;
03271        case 0x0065: /* e */ return 0x00E9;
03272        case 0x0069: /* i */ return 0x00ED;
03273        case 0x006C: /* l */ return 0x013A;
03274        case 0x006E: /* n */ return 0x0144;
03275        case 0x006F: /* o */ return 0x00F3;
03276        case 0x0072: /* r */ return 0x0155;
03277        case 0x0073: /* s */ return 0x015B;
03278        case 0x0075: /* u */ return 0x00FA;
03279        case 0x0077: /* w */ return 0x1E83;
03280        case 0x0079: /* y */ return 0x00FD;
03281        case 0x0080: /* z */ return 0x017A;
03282        default: return 0;
03283        }
03284     case 0x02C6: /* circumflex */
03285     case 0x005E: /* asciicircum */
03286        switch (base_glyph) {
03287        case 0x0041: /* A */ return 0x00C2;
03288        case 0x0045: /* E */ return 0x00CA;
03289        case 0x0047: /* G */ return 0x011C;
03290        case 0x0048: /* H */ return 0x0124;
03291        case 0x0049: /* I */ return 0x00CE;
03292        case 0x0050: /* H */ return 0x0124;
03293        case 0x004F: /* O */ return 0x00D4;
03294        case 0x0055: /* U */ return 0x00DB;
03295        case 0x0061: /* a */ return 0x00E2;
03296        case 0x0065: /* e */ return 0x00EA;
03297        case 0x0067: /* g */ return 0x011D;
03298        case 0x0068: /* h */ return 0x0125;
03299        case 0x0069: /* i */ return 0x00EE;
03300        case 0x0070: /* j */ return 0x0135;
03301        case 0x006F: /* o */ return 0x00F4;
03302        case 0x0075: /* u */ return 0x00FB;
03303        default: return 0;
03304        }
03305     case 0x02DC: /* tilde */
03306     case 0x007E: /* asciitilde */
03307        switch (base_glyph) {
03308        case 0x0041: /* A */ return 0x00C3;
03309        case 0x0049: /* I */ return 0x0128;
03310        case 0x004E: /* N */ return 0x00D1;
03311        case 0x004F: /* O */ return 0x00D5;
03312        case 0x0055: /* U */ return 0x0168;
03313        case 0x0061: /* a */ return 0x00E3;
03314        case 0x0069: /* i */ return 0x0129;
03315        case 0x006E: /* n */ return 0x00F1;
03316        case 0x006F: /* o */ return 0x00F5;
03317        case 0x0075: /* u */ return 0x0169;
03318        default: return 0;
03319        }
03320     case 0x00A8: /* dieresis */
03321        switch (base_glyph) {
03322        case 0x0041: /* A */ return 0x00C4;
03323        case 0x0045: /* E */ return 0x00CB;
03324        case 0x0049: /* I */ return 0x00CF;
03325        case 0x004F: /* O */ return 0x00D6;
03326        case 0x0055: /* U */ return 0x00DC;
03327        case 0x0057: /* w */ return 0x1E84;
03328        case 0x0061: /* a */ return 0x00E4;
03329        case 0x0065: /* e */ return 0x00EB;
03330        case 0x0069: /* i */ return 0x00EF;
03331        case 0x006F: /* o */ return 0x00F6;
03332        case 0x0075: /* u */ return 0x00FC;
03333        case 0x0077: /* w */ return 0x1E85;
03334        case 0x0079: /* y */ return 0x00FF;
03335        default: return 0;
03336        }
03337     case 0x02DA: /* ring */
03338        switch (base_glyph) {
03339        case 0x0041: /* A */ return 0x00C5;
03340        case 0x0061: /* a */ return 0x00E5;
03341        case 0x0055: /* U */ return 0x016E;
03342        case 0x0075: /* u */ return 0x016F;
03343        default: return 0;
03344        }
03345     case 0x00B8: /* cedilla */
03346        switch (base_glyph) {
03347        case 0x0043: /* C */ return 0x00C7;
03348        case 0x0063: /* c */ return 0x00E7;
03349        case 0x0053: /* S */ return 0x015E;
03350        case 0x0073: /* s */ return 0x015F;
03351        default: return 0;
03352        }
03353     case 0x02DB: /* ogonek */
03354        switch (base_glyph) {
03355        case 0x0041: /* A */ return 0x0104;
03356        case 0x0045: /* E */ return 0x0118;
03357        case 0x0049: /* I */ return 0x012E;
03358        case 0x0055: /* U */ return 0x0172;
03359        case 0x0061: /* a */ return 0x0105;
03360        case 0x0065: /* e */ return 0x0119;
03361        case 0x0069: /* i */ return 0x012F;
03362        case 0x006F: /* o */ return 0x02DB;
03363        case 0x0075: /* u */ return 0x0173;
03364        default: return 0;
03365        }
03366     case 0x002F: /* solidus */
03367        switch (base_glyph) {
03368        case 0x004C: /* L */ return 0x0141;
03369        case 0x004F: /* O */ return 0x00D8;
03370        case 0x006C: /* l */ return 0x0142;
03371        case 0x006F: /* o */ return 0x00F8;
03372        default: return 0;
03373        }
03374     case 0x02C7: /* caron */
03375        switch (base_glyph) {
03376        case 0x0043: /* C */ return 0x010C;
03377        case 0x0044: /* D */ return 0x010E;
03378        case 0x0045: /* E */ return 0x011A;
03379        case 0x0047: /* G */ return 0x01E6;
03380        case 0x004C: /* L */ return 0x013D;
03381        case 0x004E: /* N */ return 0x0147;
03382        case 0x0052: /* R */ return 0x0158;
03383        case 0x0053: /* S */ return 0x0160;
03384        case 0x0054: /* T */ return 0x0164;
03385        case 0x005A: /* Z */ return 0x017D;
03386        case 0x0063: /* c */ return 0x010D;
03387        case 0x0064: /* d */ return 0x010F;
03388        case 0x0065: /* e */ return 0x011B;
03389        case 0x0067: /* g */ return 0x01E7;
03390        case 0x006C: /* l */ return 0x013E;
03391        case 0x006E: /* n */ return 0x0148;
03392        case 0x0072: /* r */ return 0x0159;
03393        case 0x0073: /* s */ return 0x0161;
03394        case 0x0074: /* t */ return 0x0165;
03395        case 0x007A: /* z */ return 0x017E;
03396        default: return 0;
03397        }
03398     case 0x02D8: /* breve */
03399        switch (base_glyph) {
03400        case 0x0041: /* A */ return 0x0102;
03401        case 0x0045: /* E */ return 0x0114;
03402        case 0x0047: /* G */ return 0x011E;
03403        case 0x0049: /* I */ return 0x012C;
03404        case 0x004F: /* O */ return 0x014E;
03405        case 0x0055: /* U */ return 0x016C;
03406        case 0x0061: /* a */ return 0x0103;
03407        case 0x0065: /* e */ return 0x0115;
03408        case 0x0067: /* g */ return 0x011F;
03409        case 0x0069: /* i */ return 0x012D;
03410        case 0x006F: /* o */ return 0x014F;
03411        case 0x0075: /* u */ return 0x016D;
03412        default: return 0;
03413        }      
03414     case 0x02DD: /* hungarumlaut */
03415        switch (base_glyph) {
03416        case 0x004F: /* O */ return 0x0150;
03417        case 0x0055: /* U */ return 0x0170;
03418        case 0x006F: /* o */ return 0x0151;
03419        case 0x0075: /* u */ return 0x0171;
03420        default: return 0;
03421        }
03422     case 0x00AF: /* macron */
03423        switch (base_glyph) {
03424        case 0x0041: /* A */ return 0x0100;
03425        case 0x0045: /* E */ return 0x0112;
03426        case 0x0049: /* I */ return 0x012A;
03427        case 0x004F: /* O */ return 0x014C;
03428        case 0x0055: /* U */ return 0x016A;
03429        case 0x0061: /* a */ return 0x0101;
03430        case 0x0065: /* e */ return 0x0113;
03431        case 0x0069: /* i */ return 0x012B;
03432        case 0x006D: /* m */ return 0x00AF;
03433        case 0x006F: /* o */ return 0x014D;
03434        case 0x0075: /* u */ return 0x016B;
03435        default: return 0;
03436        }
03437        /* special cases: accent - char inverted */
03438     case 0x0043: /* C; special case: cedilla is set after C in OT1 */
03439        switch (base_glyph) {
03440        case 0x00B8: /* cedilla */ return 0x00C7;
03441        default: return 0;
03442        }
03443     case 0x0063: /* c; see above */
03444        switch (base_glyph) {
03445        case 0x00B8: /* cedilla */ return 0x00E7;
03446        default: return 0;
03447        }
03448     case 0x0053: /* S; see above */
03449        switch (base_glyph) {
03450        case 0x00B8: /* cedilla */ return 0x015E;
03451        default: return 0;
03452        }
03453     case 0x0073: /* s; see above */
03454        switch (base_glyph) {
03455        case 0x00B8: /* cedilla */ return 0x015F;
03456        default: return 0;
03457        }
03458     }
03459     return 0;
03460 }
03461 
03462 uint32_t
03463 guess_encoding(wide_ubyte ch, const char *fontname, char *retbuf)
03464 {
03465     uint32_t i;
03466     static hashTableT unknown_font_hash;
03467     static Boolean hash_initialized = False;
03468     size_t dummy = 0;
03469     
03470     TRACE_FIND_VERBOSE((stderr, "guess_encoding: |%s|, char 0x%.4X", fontname, ch));
03471 
03472     /* our encoding vectors only have size 256 */
03473     if (ch > 255) {
03474        XDVI_WARNING((stderr, "guess_encoding: font index %lu too large", (unsigned long)ch));
03475        return 0;
03476     }
03477 
03478     if (memcmp(fontname, "gbk", 3) == 0
03479               && isdigit((int)fontname[(i=strlen(fontname))-1])
03480               && isdigit((int)fontname[i-2])) {
03481 #if HAVE_ICONV_H
03482        unsigned char cjk[2];
03483        TRACE_FIND_VERBOSE((stderr, "guess_encoding: CJK fonts (GBK encoding)"));
03484        i = atoi(fontname + i - 2);        /* font no */
03485        i = (i - 1) * 256 + (uint32_t)ch;  /* char index */
03486        cjk[0] = i / 190 + 129;
03487        cjk[1] = i % 190 + 64;
03488        if (cjk[1] >= 128)
03489            cjk[1]++;
03490        return cjk2unicode(cjk);
03491 #else /* HAVE_ICONV_H */
03492        if (!warned_about_cjk) {
03493            popup_message(globals.widgets.top_level,
03494                        MSG_WARN, NULL, "This version of xdvi has been compiled without iconv support - "
03495                        "cannot convert CJK character to UTF-8");
03496            warned_about_cjk = True;
03497        }
03498        return 0;
03499 #endif /* HAVE_ICONV_H */
03500     }
03501 
03502     if (memcmp(fontname, "cmsy", 4) == 0) {
03503        TRACE_FIND_VERBOSE((stderr, "guess_encoding: %s => m_cm_symbol", fontname));
03504        return m_cm_symbol_encoding[ch];
03505     }
03506     if (memcmp(fontname, "cmmi", 4) == 0) {
03507        TRACE_FIND_VERBOSE((stderr, "guess_encoding: %s => m_cm_math_italics", fontname));
03508        return m_cm_math_italics_encoding[ch];
03509     }
03510     if (memcmp(fontname, "cmex", 4) == 0) {
03511        TRACE_FIND_VERBOSE((stderr, "guess_encoding: %s => m_cm_math_extended", fontname));
03512        return m_cm_math_extended_encoding[ch];
03513     }
03514     if (memcmp(fontname, "cmtt", 4) == 0) {
03515        TRACE_FIND_VERBOSE((stderr, "guess_encoding: %s => m_cm_typewriter", fontname));
03516        return m_cm_typewriter_encoding[ch];
03517     }
03518     /* following to cover cmsl, cmb, cmbx, cmti, cmdunghill, whatever ...
03519        hope it doesn't overgenerate ;-) */
03520     if (memcmp(fontname, "cm", 2) == 0
03521        || memcmp(fontname, "lcmss", strlen("lcmss")) == 0 /* lcmss8 etc. */
03522        || memcmp(fontname, "ygoth", strlen("ygoth")) == 0
03523        || memcmp(fontname, "yinit", strlen("yinit")) == 0
03524        || memcmp(fontname, "logo", strlen("logo")) == 0
03525        || memcmp(fontname, "rsfs", strlen("rsfs")) == 0
03526        ) {
03527        TRACE_FIND_VERBOSE((stderr, "guess_encoding: %s => m_ot1", fontname));
03528        return m_ot1_encoding[ch];
03529     }
03530     /* cyrillic fonts */
03531     if (memcmp(fontname, "la", 2) == 0) {
03532        TRACE_FIND_VERBOSE((stderr, "guess_encoding: %s => m_t2", fontname));
03533        return m_t2_encoding[ch];
03534     }
03535     if (memcmp(fontname, "ec", 2) == 0
03536        || memcmp(fontname, "eb", 2) == 0) {
03537        TRACE_FIND_VERBOSE((stderr, "guess_encoding: %s => m_cork", fontname));
03538        /* FIXME: why cork and not EC? What font actually uses EC?
03539           The only difference seems that dvips' EC.enc has `ldot' at 0xb8,
03540           whereas cork.enc has `ydieresis' there. A document with
03541           \usepackage[T1]{fontenc}
03542           also produces a ydieresis.
03543         */
03544        return m_cork_encoding[ch];
03545     }
03546     if (memcmp(fontname, "tc", 2) == 0) {
03547        TRACE_FIND_VERBOSE((stderr, "guess_encoding: %s => m_ts1", fontname));
03548        return m_ts1_encoding[ch];
03549     }
03550     /* blackletter fonts with funny encoding */
03551     if (memcmp(fontname, "ysmfrak", 7) == 0
03552        || memcmp(fontname, "yswab", 5) == 0) {
03553        TRACE_FIND_VERBOSE((stderr, "guess_encoding: %s => m_yfrak", fontname));
03554        /* special cases for ligatures */
03555        switch (ch) {
03556        case 0x85: strcpy(retbuf, "ch"); return 0;
03557        case 0x86: strcpy(retbuf, "ck"); return 0;
03558        case 0xA7: strcpy(retbuf, "sz"); return 0;
03559        default: return m_yfrak_encoding[ch];
03560        }
03561     }
03562 
03563     /* euler mathematical */
03564     if (memcmp(fontname, "eufm", strlen("eufm")) == 0
03565        || memcmp(fontname, "eusm", strlen("eufm")) == 0
03566        ) {
03567        switch (ch) {
03568        case 0x0: case 0x1: return 'd'; break;
03569        case 0x2: case 0x3: return 'f'; break;
03570        case 0x4: return 'g'; break;
03571        case 0x5: return 'k'; break;
03572        case 0x6: return 't'; break;
03573        case 0x7: return 'u'; break;
03574        default: return m_ot1_encoding[ch];
03575        }
03576     }
03577               
03578     
03579     /* stuff that doesn't have a good ASCII representation */
03580     if (memcmp(fontname, "lcircle", strlen("lcircle")) == 0
03581        || memcmp(fontname, "line", strlen("line")) == 0
03582        || memcmp(fontname, "fmvr8x", strlen("fmvr8x")) == 0
03583        || memcmp(fontname, "feymr", strlen("feymr")) == 0
03584        || memcmp(fontname, "msbm", strlen("msbm")) == 0
03585        || memcmp(fontname, "msam", strlen("msam")) == 0
03586        || memcmp(fontname, "wasy", strlen("wasy")) == 0
03587        || memcmp(fontname, "txsy", strlen("txsy")) == 0
03588        ) {
03589        return 0;
03590     }
03591 
03592     /* TODO:
03593        txfonts
03594     */
03595     
03596     /* default: assume cork encoding, and print out a warning for each font */
03597     if (!hash_initialized) {
03598        unknown_font_hash = hash_create(1031);
03599        hash_initialized = True;
03600     }
03601     if (!find_str_int_hash(&unknown_font_hash, fontname, &dummy)) {
03602        XDVI_WARNING((stderr,
03603                     "guess_encoding(): nothing suitable for \"%s\", assuming Cork encoding.\n"
03604                     "(Please tell us about this at "
03605                     "http://sourceforge.net/tracker/?group_id=23164&atid=377580)", fontname));
03606        put_str_int_hash(&unknown_font_hash, fontname, dummy);
03607     }
03608     return m_cork_encoding[ch];
03609 }
03610 
03611 /*
03612   Mapping of unicode glyphs to ASCII `equivalents'
03613   that are useful when searching for text.
03614 */
03615 const char *
03616 search_normalize_chars(uint32_t unicode)
03617 {
03618     const char *ret = NULL;
03619     switch(unicode) {
03620     case 0x2212: ret = "-"; break;
03621     case 0x2022: ret = "\xb7";     break; /* middle dot */
03622     default: ret = NULL;    break;
03623     }
03624     if (ret != NULL) {
03625         TRACE_FIND((stderr, "expand_searchchars: 0x%X --> `%s'",
03626                     (unsigned int)unicode, ret));
03627     }
03628     return ret;
03629 }
03630 
03631 /*
03632   Expand a unicode ligature character consisting of several
03633   `ordinary' characters to a string of those characters, and
03634   map some unicode glyphs to ASCII `equivalents'.
03635   
03636   TODO: move the more ambiguous replacements (e.g.
03637   guilsinglleft vs. angleleft) into a user-defined table?
03638 */
03639 const char *
03640 expand_ligature(uint32_t unicode)
03641 {
03642     const char *ret = NULL;
03643     switch(unicode) {
03644     case 0xFB00: ret = "ff";       break;
03645     case 0xFB01: ret = "fi";       break;
03646     case 0xFB02: ret = "fl";       break;
03647     case 0xFB03: ret = "ffi";      break;
03648     case 0xFB04: ret = "ffl";      break;
03649     case 0xFB06: ret = "st";       break;
03650     case 0x0133: ret = "ij";       break;
03651     case 0x2013: ret = "--";       break;
03652     case 0x2014: ret = "---";      break;
03653     case 0x2039:
03654     case 0x2329: ret = "<"; break;
03655     case 0x203A:
03656     case 0x232A: ret = ">"; break;
03657     case 0x2018: ret = "`"; break;
03658     case 0x2019: ret = "'"; break;
03659     case 0x201C: ret = "``";       break;
03660     case 0x201D: ret = "''";       break;
03661     case 0x2026: ret = "...";      break;
03662     case 0x10ff28: ret = "{";      break;
03663     case 0x10ff29: ret = "}";      break;
03664     default: ret = NULL;    break;
03665     }
03666     if (ret != NULL) {
03667         TRACE_FIND((stderr, "expand_ligature: 0x%X --> `%s'",
03668                     (unsigned int)unicode, ret));
03669     }
03670     return ret;
03671 }
03672 
03673 /*
03674  * Convert the utf8-string passed as argument to lowercase, by
03675  * first converting to UCS4, then converting back, lowercasing the
03676  * UCS4 characters as we go (it's easier like that).
03677  */
03678 Boolean
03679 utf8_lowercase(char *utf8)
03680 {
03681     size_t utf8_len = strlen(utf8) + 1; /* also convert terminating byte (acutally not needed ...) */
03682     size_t ucs4_len = utf8_len * 6; /* ample ... */
03683     int i = 0;
03684     uint32_t *ucs4 = xmalloc(ucs4_len);
03685     uint32_t *ucs4_start = ucs4; /* save for free()ing */
03686     for (; *utf8 != '\0'; ucs4++, utf8 += i) {
03687        size_t conv_len;
03688        if ((i = utf8_to_ucs4(utf8, ucs4, 6 /* don't care about character len */)) < 0) {
03689            XDVI_ERROR((stderr, "Error in utf8_lowercase: Illegal UTF-8 sequence"));
03690            free(ucs4_start);
03691            return False;
03692        }
03693        ucs4_to_utf8(*ucs4, utf8, &conv_len, True); /* lowercases it */
03694        if ((int)conv_len != i) {
03695            XDVI_ERROR((stderr, "Error in utf8_lowercase: length after UCS4 conversion (%lu)\n"
03696                      "differs from length after utf8 conversion(%lu) (string: %s)\n",
03697                      (unsigned long)conv_len, (unsigned long)i, utf8));
03698            free(ucs4_start);
03699            return False;
03700        }
03701     }
03702     free(ucs4_start);
03703     return True;
03704 }
03705 
03706 /*
03707  * Adapted from iconv's utf8_wctomb in lib/utf8.h
03708  * Converts the character sequence pointed to by utf8 of maximum length `len'
03709  * into an UCS4 character pointed to by ucs4.
03710  * TODO: maybe implement this as a macro??
03711  */
03712 int
03713 utf8_to_ucs4(const char *utf8, uint32_t *ucs4, size_t len)
03714 {
03715     const unsigned char *str = (const unsigned char *)utf8;
03716     unsigned char c = *str;
03717 
03718     if (c < 0x80) {
03719        *ucs4 = c;
03720        return 1;
03721     }
03722     else if (c < 0xc2) {
03723        return -1; /* illegal UTF8; shouldn't happen */
03724     }
03725     else if (c < 0xe0) {
03726        if (len < 2)
03727            return -1; /* len too short */
03728        if (!((str[1] ^ 0x80) < 0x40)) {
03729            return -1; /* illegal UTF8; shouldn't happen */
03730        }
03731        *ucs4 = ((uint32_t) (c & 0x1f) << 6)
03732            | (uint32_t) (str[1] ^ 0x80);
03733        return 2;
03734     }
03735     else if (c < 0xf0) {
03736        if (len < 3)
03737            return -1; /* len too short */
03738        if (!((str[1] ^ 0x80) < 0x40
03739              && (str[2] ^ 0x80) < 0x40
03740              && (c >= 0xe1 || str[1] >= 0xa0))) {
03741            return -1; /* illegal UTF8; shouldn't happen */
03742        }
03743        *ucs4 = ((uint32_t) (c & 0x0f) << 12)
03744            | ((uint32_t) (str[1] ^ 0x80) << 6)
03745            | (uint32_t) (str[2] ^ 0x80);
03746        return 3;
03747     }
03748     else if (c < 0xf8 && sizeof(uint32_t) * 8 >= 32) {
03749        if (len < 4)
03750            return -1; /* len too short */
03751        if (!((str[1] ^ 0x80) < 0x40
03752              && (str[2] ^ 0x80) < 0x40
03753              && (str[3] ^ 0x80) < 0x40
03754              && (c >= 0xf1 || str[1] >= 0x90))) {
03755            return -1; /* illegal UTF8; shouldn't happen */
03756        }
03757        *ucs4 = ((uint32_t) (c & 0x07) << 18)
03758            | ((uint32_t) (str[1] ^ 0x80) << 12)
03759            | ((uint32_t) (str[2] ^ 0x80) << 6)
03760            | (uint32_t) (str[3] ^ 0x80);
03761        return 4;
03762     }
03763     else if (c < 0xfc && sizeof(uint32_t)*8 >= 32) {
03764        if (len < 5)
03765            return -1; /* len too short */
03766        if (!((str[1] ^ 0x80) < 0x40
03767              && (str[2] ^ 0x80) < 0x40
03768              && (str[3] ^ 0x80) < 0x40
03769              && (str[4] ^ 0x80) < 0x40
03770              && (c >= 0xf9 || str[1] >= 0x88))) {
03771            return -1; /* illegal UTF8; shouldn't happen */
03772        }
03773        *ucs4 = ((uint32_t) (c & 0x03) << 24)
03774            | ((uint32_t) (str[1] ^ 0x80) << 18)
03775            | ((uint32_t) (str[2] ^ 0x80) << 12)
03776            | ((uint32_t) (str[3] ^ 0x80) << 6)
03777            | (uint32_t) (str[4] ^ 0x80);
03778        return 5;
03779     }
03780     else if (c < 0xfe && sizeof(uint32_t)*8 >= 32) {
03781        if (len < 6)
03782            return -1; /* len too short */
03783        if (!((str[1] ^ 0x80) < 0x40
03784              && (str[2] ^ 0x80) < 0x40
03785              && (str[3] ^ 0x80) < 0x40
03786              && (str[4] ^ 0x80) < 0x40
03787              && (str[5] ^ 0x80) < 0x40
03788              && (c >= 0xfd || str[1] >= 0x84))) {
03789            return -1; /* illegal UTF8; shouldn't happen */
03790        }
03791        *ucs4 = ((uint32_t) (c & 0x01) << 30)
03792            | ((uint32_t) (str[1] ^ 0x80) << 24)
03793            | ((uint32_t) (str[2] ^ 0x80) << 18)
03794            | ((uint32_t) (str[3] ^ 0x80) << 12)
03795            | ((uint32_t) (str[4] ^ 0x80) << 6)
03796            | (uint32_t) (str[5] ^ 0x80);
03797        return 6;
03798     }
03799     else {
03800        return -1; /* illegal UTF8 */
03801     }
03802 }
03803 
03804 /* adapted from iconv's utf8_wctomb in lib/utf8.h */
03805 /* TODO: maybe implement this as a macro?? */
03806 void
03807 ucs4_to_utf8(uint32_t ucs4, char *utf8, size_t *len, Boolean do_lowercase)
03808 {
03809     if (do_lowercase)
03810        ucs4 = ucs4_lowercase(ucs4);
03811     
03812     if (ucs4 < 0x80)
03813        *len = 1;
03814     else if (ucs4 < 0x800)
03815        *len = 2;
03816     else if (ucs4 < 0x10000)
03817        *len = 3;
03818     else if (ucs4 < 0x200000)
03819        *len = 4;
03820     else if (ucs4 < 0x4000000)
03821        *len = 5;
03822     else if (ucs4 <= 0x7fffffff)
03823        *len = 6;
03824 
03825     switch(*len) { /* note: code falls through cases! */
03826     case 6: utf8[5] = 0x80 | (ucs4 & 0x3f); ucs4 = ucs4 >> 6; ucs4 |= 0x4000000;
03827     case 5: utf8[4] = 0x80 | (ucs4 & 0x3f); ucs4 = ucs4 >> 6; ucs4 |= 0x200000;
03828     case 4: utf8[3] = 0x80 | (ucs4 & 0x3f); ucs4 = ucs4 >> 6; ucs4 |= 0x10000;
03829     case 3: utf8[2] = 0x80 | (ucs4 & 0x3f); ucs4 = ucs4 >> 6; ucs4 |= 0x800;
03830     case 2: utf8[1] = 0x80 | (ucs4 & 0x3f); ucs4 = ucs4 >> 6; ucs4 |= 0xc0;
03831     case 1: utf8[0] = ucs4;
03832     }
03833 }
03834 
03835 
03836 
03837 /*
03838  * (Lossy) conversion of utf8 sequence to an iso-latin1; produces
03839  * `?' if the character is not representable in iso-latin1.
03840  * Returns the number of converted characters in `len'.
03841  */
03842 unsigned char
03843 utf8_to_iso_8859_1(const char *utf8, size_t *len)
03844 {
03845     unsigned char c = *utf8;
03846     uint32_t wc;
03847 
03848     if (c < 0x80) {
03849        *len = 1;
03850        return c;
03851     }
03852     else if (c < 0xe0) {
03853        *len = 2;
03854        wc = ((unsigned char)(c & 0x1f) << 6) | (unsigned char)(utf8[1] ^ 0x80);
03855        if (wc <= 0xff)
03856            return (unsigned char)wc;
03857        else
03858            return '?';
03859     }
03860     else if (c < 0xf0) {
03861        *len = 3;
03862        return '?';
03863     }
03864     else if (c < 0xf8) {
03865        *len = 4;
03866        return '?';
03867     }
03868     else if (c < 0xfc) {
03869        *len = 5;
03870        return '?';
03871     }
03872     else if (c < 0xfe) {
03873        *len = 6;
03874        return '?';
03875     }
03876     else
03877        return '?';
03878 }
03879 
03880 /* convert an iso_8859_1 character to utf8, writing the result
03881    to the buffer `utf8' (which should have at least length 2),
03882    and storing the length of the converted utf-8 sequence in *len.
03883 */
03884 void
03885 iso_8859_1_to_utf8(unsigned char c, char *utf8, size_t *len)
03886 {
03887     if (c < 0x80) {
03888        *len = 1;
03889        utf8[0] = c;
03890     }
03891     else {
03892        *len = 2;
03893        utf8[1] = 0x80 | (c & 0x3f);
03894        c >>= 6;
03895        utf8[0] = 0xc0 | (c & 0x1f);
03896     }
03897 }
03898 
03899 /* Convert an iso_latin-1 string to a UTF-8 string (including the
03900    terminating `\0'), not writing more than `len' characters to
03901    `utf8'. Returns the number of written characters, or -1 if len was
03902    too small to convert the entire input string.
03903 */
03904 int
03905 str_iso_8859_1_to_utf8(const char *latin1, char *utf8, size_t len)
03906 {
03907     size_t i = 0;
03908 
03909     while (i < len && *latin1 != '\0') {
03910        char tmpbuf[2];
03911        size_t tmp_len = 0;
03912        iso_8859_1_to_utf8((unsigned char)*latin1, tmpbuf, &tmp_len);
03913        if (i + tmp_len >= len)
03914            return -1;
03915        memcpy(utf8 + i, tmpbuf, tmp_len);
03916        i += tmp_len;
03917        latin1++;
03918     }
03919     /* terminate utf8 */
03920     if (i < len)
03921        utf8[i++] = '\0';
03922     else
03923        return -1;
03924     
03925     return i;
03926 }
03927 
03928 Boolean
03929 is_hyphenchar(uint32_t u)
03930 {
03931     if (u == 0x002D || u ==  0x00AD)
03932        return True;
03933     return False;
03934 }
03935 
03936 /*
03937  * Determine ideographic property according to
03938  * http://www.unicode.org/Public/UNIDATA/PropList.txt:
03939  * 
03940  * 3006          ; Ideographic # Lo       IDEOGRAPHIC CLOSING MARK
03941  * 3007          ; Ideographic # Nl       IDEOGRAPHIC NUMBER ZERO
03942  * 3021..3029    ; Ideographic # Nl   [9] HANGZHOU NUMERAL ONE..HANGZHOU NUMERAL NINE
03943  * 3038..303A    ; Ideographic # Nl   [3] HANGZHOU NUMERAL TEN..HANGZHOU NUMERAL THIRTY
03944  * 3400..4DB5    ; Ideographic # Lo [6582] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DB5
03945  * 4E00..9FA5    ; Ideographic # Lo [20902] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FA5
03946  * F900..FA2D    ; Ideographic # Lo [302] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA2D
03947  * 20000..2A6D6  ; Ideographic # Lo [42711] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6D6
03948  * 2F800..2FA1D  ; Ideographic # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
03949  * 
03950  * # Total code points: 71053
03951  *
03952  * plus space, comma and full stop.
03953  *
03954  */
03955 Boolean
03956 is_ideograph(uint32_t u)
03957 {
03958     return (u >= 0x3000 && u <= 0x3002) || /* IDEOGRAPHIC SPACE, COMMA, FULL STOP */
03959        u == 0xFF61 || /* HALFWIDTH IDEOGRAPHIC FULL STOP */
03960        u == 0xFF64 || /* HALFWIDTH IDEOGRAPHIC COMMA */
03961        (u >= 0x3006 && u <= 0x3007) ||
03962        (u >= 0x3021 && u <= 0x3029) ||
03963        (u >= 0x3038 && u <= 0x303A) ||
03964        (u >= 0x3400 && u <= 0x4DB5) ||
03965        (u >= 0x4E00 && u <= 0x9FA5) ||
03966        (u >= 0xF900 && u <= 0xFA2D) ||
03967        (u >= 0x20000 && u <= 0x2A6D6) ||
03968        (u >= 0x2F800 && u <= 0x2FA1D);
03969 }
03970 
03971 char *
03972 str_utf8_to_iso_8859_1(const char *utf8)
03973 {
03974     size_t utf8_len = strlen(utf8), i = 0, offset = 0;
03975     char *buf = xmalloc(4 * utf8_len + 1); /* worst case of non-printables */
03976 
03977     while (i < utf8_len) {
03978        uint32_t ucs4;
03979        const char *ret;
03980 
03981        /*  fprintf(stderr, "offset: %d\n", (int)offset); */
03982        /* first apply normalization heurisitcs also used by search */
03983        size_t len = utf8_to_ucs4(utf8 + i, &ucs4, utf8_len + 1);
03984        if ((ret = search_normalize_chars(ucs4)) != NULL) {
03985            size_t len_ret = strlen(ret);
03986            memcpy(buf + offset, ret, len_ret);
03987            offset += len_ret;
03988        }
03989        else if (ucs4 <= 0xff) { /* in iso-latin1 range */
03990            buf[offset++] = (unsigned char)ucs4;
03991        }
03992        else {
03993            sprintf(buf + offset, "\\%.4lX", (unsigned long)ucs4);
03994            offset += 4;
03995        }
03996        i += len;
03997     }
03998     buf[offset] = '\0';
03999     
04000     return buf;
04001 }