iconvdata/iso-2022-jp.c

   1 /* Conversion module for ISO-2022-JP.
   2    Copyright (C) 1998, 1999 Free Software Foundation, Inc.
   3    This file is part of the GNU C Library.
   4    Contributed by Ulrich Drepper <drepper@cygnus.com>, 1998.
   5
   6    The GNU C Library is free software; you can redistribute it and/or
   7    modify it under the terms of the GNU Library General Public License as
   8    published by the Free Software Foundation; either version 2 of the
   9    License, or (at your option) any later version.
  10
  11    The GNU C Library is distributed in the hope that it will be useful,
  12    but WITHOUT ANY WARRANTY; without even the implied warranty of
  13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  14    Library General Public License for more details.
  15
  16    You should have received a copy of the GNU Library General Public
  17    License along with the GNU C Library; see the file COPYING.LIB.  If not,
  18    write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
  19    Boston, MA 02111-1307, USA.  */
  20
  21 #include <gconv.h>
  22 #include <stdint.h>
  23 #include <stdlib.h>
  24 #include <string.h>
  25 #include "jis0201.h"
  26 #include "jis0208.h"
  27 #include "jis0212.h"
  28 #include "gb2312.h"
  29 #include "ksc5601.h"
  30
   31 struct gap  /* Declared ahead of the iso8859-7jp.h include that follows.  */
   32 {
   33   uint16_t start;  /* Presumably first value of a range -- TODO confirm.  */
   34   uint16_t end;    /* Presumably last value of that range -- TODO confirm.  */
   35   int32_t idx;     /* Presumably a table index/offset -- TODO confirm.  */
   36 };
  37
  38 #include "iso8859-7jp.h"
  39
  40 /* This makes obvious what everybody knows: 0x1b is the Esc character.  */
   41 #define ESC 0x1b
   42
   43 /* We provide our own initialization and destructor functions (see below).  */
   44 #define DEFINE_INIT     0
   45 #define DEFINE_FINI     0
   46
   47 /* Definitions used in the body of the `gconv' function.  */
   48 #define FROM_LOOP               from_iso2022jp_loop
   49 #define TO_LOOP                 to_iso2022jp_loop
   50 #define MIN_NEEDED_FROM         1  /* Shortest ISO-2022-JP item: one byte.  */
   51 #define MAX_NEEDED_FROM         4  /* Longest escape sequence read here.  */
   52 #define MIN_NEEDED_TO           4  /* One UCS4 value is four bytes.  */
   53 #define MAX_NEEDED_TO           4
   54 #define FROM_DIRECTION          (dir == from_iso2022jp)
   55 #define PREPARE_LOOP \
   56   enum direction dir = ((struct iso2022jp_data *) step->data)->dir;           \
   57   enum variant var = ((struct iso2022jp_data *) step->data)->var;             \
   58   int save_set;  /* Holds the state for SAVE_RESET_STATE.  */                 \
   59   int *setp = &data->statep->count;  /* Set in low byte, G2 above it.  */
   60 #define EXTRA_LOOP_ARGS         , var, setp  /* Match EXTRA_LOOP_DECLS.  */
  61
  62
  63 /* Direction of the transformation.  */
   64 enum direction
   65 {
   66   illegal_dir,     /* No supported charset name matched in gconv_init.  */
   67   to_iso2022jp,    /* The target charset of the step is ours (encoding).  */
   68   from_iso2022jp   /* The source charset of the step is ours (decoding).  */
   69 };
  70
   71 /* We handle ISO-2022-JP and ISO-2022-JP-2 here.  */
   72 enum variant
   73 {
   74   illegal_var,   /* No supported charset name matched in gconv_init.  */
   75   iso2022jp,     /* Selected by the charset name "ISO-2022-JP//".  */
   76   iso2022jp2     /* Selected by the charset name "ISO-2022-JP-2//".  */
   77 };
  78
  79
   80 struct iso2022jp_data  /* Per-step data allocated by gconv_init.  */
   81 {
   82   enum direction dir;  /* Which way this step converts.  */
   83   enum variant var;    /* Which of the two encodings is handled.  */
   84 };
  85
  86
  87 /* The COUNT element of the state keeps track of the currently selected
  88    character set.  The possible values are:  */
   89 enum  /* Comments give the escape sequence the decoder below accepts.  */
   90 {
   91   ASCII_set = 0,        /* ESC ( B; also the initial state.  */
   92   JISX0208_1978_set,    /* ESC $ @  */
   93   JISX0208_1983_set,    /* ESC $ B  */
   94   JISX0201_Roman_set,   /* ESC ( J  */
   95   JISX0201_Kana_set,    /* ESC ( I, ISO-2022-JP-2 only.  */
   96   GB2312_set,           /* ESC $ A, ISO-2022-JP-2 only.  */
   97   KSC5601_set,          /* ESC $ ( C, ISO-2022-JP-2 only.  */
   98   JISX0212_set          /* ESC $ ( D, ISO-2022-JP-2 only.  */
   99 };
 100
 101 /* The second value stored is the designation of the G2 set.  The following
 102    values are possible:  */
  103 enum  /* Comments give the escape sequence the decoder below accepts.  */
  104 {
  105   UNSPECIFIED_set = 0,  /* No G2 set has been designated.  */
  106   ISO88591_set,         /* ESC . A, ISO-2022-JP-2 only.  */
  107   ISO88597_set          /* ESC . F, ISO-2022-JP-2 only.  */
  108 };
 109
 110
 111 int
 112 gconv_init (struct gconv_step *step)
 113 {
 114   /* Determine which direction.  */
 115   struct iso2022jp_data *new_data;
 116   enum direction dir = illegal_dir;
 117   enum variant var = illegal_var;
 118   int result;
 119
 120   if (__strcasecmp (step->from_name, "ISO-2022-JP//") == 0)
 121     {
 122       dir = from_iso2022jp;
 123       var = iso2022jp;
 124     }
 125   else if (__strcasecmp (step->to_name, "ISO-2022-JP//") == 0)
 126     {
 127       dir = to_iso2022jp;
 128       var = iso2022jp;
 129     }
 130   else if (__strcasecmp (step->from_name, "ISO-2022-JP-2//") == 0)
 131     {
 132       dir = from_iso2022jp;
 133       var = iso2022jp2;
 134     }
 135   else if (__strcasecmp (step->to_name, "ISO-2022-JP-2//") == 0)
 136     {
 137       dir = to_iso2022jp;
 138       var = iso2022jp2;
 139     }
 140
 141   result = GCONV_NOCONV;
 142   if (dir != illegal_dir)
 143     {
 144       new_data
 145         = (struct iso2022jp_data *) malloc (sizeof (struct iso2022jp_data));
 146
 147       result = GCONV_NOMEM;
 148       if (new_data != NULL)
 149         {
 150           new_data->dir = dir;
 151           new_data->var = var;
 152           step->data = new_data;
 153
 154           if (dir == from_iso2022jp)
 155             {
 156               step->min_needed_from = MIN_NEEDED_FROM;
 157               step->max_needed_from = MAX_NEEDED_FROM;
 158               step->min_needed_to = MIN_NEEDED_TO;
 159               step->max_needed_to = MAX_NEEDED_TO;
 160             }
 161           else
 162             {
 163               step->min_needed_from = MIN_NEEDED_TO;
 164               step->max_needed_from = MAX_NEEDED_TO;
 165               step->min_needed_to = MIN_NEEDED_FROM;
 166               step->max_needed_to = MAX_NEEDED_FROM + 2;
 167             }
 168
 169           /* Yes, this is a stateful encoding.  */
 170           step->stateful = 1;
 171
 172           result = GCONV_OK;
 173         }
 174     }
 175
 176   return result;
 177 }
 178
 179
  180 void
  181 gconv_end (struct gconv_step *data)
  182 {
  183   free (data->data);  /* Release the data gconv_init attached.  */
  184 }
 185
 186
 187 /* Since this is a stateful encoding we have to provide code which resets
 188    the output state to the initial state.  This has to be done during the
 189    flushing.  */
  190 #define EMIT_SHIFT_TO_INIT /* Expects DATA, STEP and STATUS in scope.  */ \
  191   if (data->statep->count != ASCII_set)  /* Also true if only G2 is set.  */  \
  192     {                                                                         \
  193       enum direction dir = ((struct iso2022jp_data *) step->data)->dir;       \
  194                                                                               \
  195       if (dir == from_iso2022jp)                                              \
  196         /* It's easy, we don't have to emit anything, we just reset the       \
  197            state for the input.  Note that this also clears the G2            \
  198            designation.  */                                                   \
  199         data->statep->count = ASCII_set;                                      \
  200       else                                                                    \
  201         {                                                                     \
  202           unsigned char *outbuf = data->outbuf;                               \
  203                                                                               \
  204           /* We are not in the initial state.  To switch back we have         \
  205              to emit the sequence `Esc ( B'.  */                              \
  206           if (outbuf + 3 > data->outbufend)                                   \
  207             /* No room for the three bytes; the state stays as it is.  */     \
  208             status = GCONV_FULL_OUTPUT;                                       \
  209           else                                                                \
  210             {                                                                 \
  211               /* Write out the shift sequence.  */                            \
  212               *outbuf++ = ESC;                                                \
  213               *outbuf++ = '(';                                                \
  214               *outbuf++ = 'B';                                                \
  215               data->outbuf = outbuf;                                          \
  216               /* Note that this also clears the G2 designation.  */           \
  217               data->statep->count = ASCII_set;                                \
  218             }                                                                 \
  219         }                                                                     \
  220     }
 221
 222
  223 /* Since we might have to reset the input pointer we must be able to save
  224    and restore the state.  */
  225 #define SAVE_RESET_STATE(Save) \
  226   if (Save)  /* Nonzero: remember the current state in SAVE_SET.  */          \
  227     save_set = *setp;                                                         \
  228   else       /* Zero: put the remembered state back into *SETP.  */           \
  229     *setp = save_set
 230
 231
 232 /* First define the conversion function from ISO-2022-JP to UCS4.  */
 233 #define MIN_NEEDED_INPUT        MIN_NEEDED_FROM
 234 #define MAX_NEEDED_INPUT        MAX_NEEDED_FROM
 235 #define MIN_NEEDED_OUTPUT       MIN_NEEDED_TO
 236 #define LOOPFCT                 FROM_LOOP
 237 #define BODY \
 238   {                                                                           \
 239     uint32_t ch = *inptr;                                                     \
 240                                                                               \
 241     /* Recognize escape sequences.  */                                        \
 242     if (ch == ESC)                                                            \
 243       {                                                                       \
 244         /* We now must be prepared to read two to three more                  \
 245            chracters.  If we have a match in the first character but          \
 246            then the input buffer ends we terminate with an error since        \
 247            we must not risk missing an escape sequence just because it        \
 248            is not entirely in the current input buffer.  */                   \
 249         if (inptr + 2 >= inend                                                \
 250             || (var == iso2022jp2 && inptr[1] == '$' && inptr[2] == '('       \
 251                 && inptr + 3 >= inend))                                       \
 252           {                                                                   \
 253             /* Not enough input available.  */                                \
 254             result = GCONV_EMPTY_INPUT;                                       \
 255             break;                                                            \
 256           }                                                                   \
 257                                                                               \
 258         if (inptr[1] == '(')                                                  \
 259           {                                                                   \
 260             if (inptr[2] == 'B')                                              \
 261               {                                                               \
 262                 /* ASCII selected.  */                                        \
 263                 set = ASCII_set;                                              \
 264                 inptr += 3;                                                   \
 265                 continue;                                                     \
 266               }                                                               \
 267             else if (inptr[2] == 'J')                                         \
 268               {                                                               \
 269                 /* JIS X 0201 selected.  */                                   \
 270                 set = JISX0201_Roman_set;                                     \
 271                 inptr += 3;                                                   \
 272                 continue;                                                     \
 273               }                                                               \
 274             else if (var == iso2022jp2 && inptr[2] == 'I')                    \
 275               {                                                               \
 276                 /* JIS X 0201 selected.  */                                   \
 277                 set = JISX0201_Kana_set;                                      \
 278                 inptr += 3;                                                   \
 279                 continue;                                                     \
 280               }                                                               \
 281           }                                                                   \
 282         else if (inptr[1] == '$')                                             \
 283           {                                                                   \
 284             if (inptr[2] == '@')                                              \
 285               {                                                               \
 286                 /* JIS X 0208-1978 selected.  */                              \
 287                 set = JISX0208_1978_set;                                      \
 288                 inptr += 3;                                                   \
 289                 continue;                                                     \
 290               }                                                               \
 291             else if (inptr[2] == 'B')                                         \
 292               {                                                               \
 293                 /* JIS X 0208-1983 selected.  */                              \
 294                 set = JISX0208_1983_set;                                      \
 295                 inptr += 3;                                                   \
 296                 continue;                                                     \
 297               }                                                               \
 298             else if (var == iso2022jp2)                                       \
 299               {                                                               \
 300                 if (inptr[2] == 'A')                                          \
 301                   {                                                           \
 302                     /* GB 2312-1980 selected.  */                             \
 303                     set = GB2312_set;                                         \
 304                     inptr += 3;                                               \
 305                     continue;                                                 \
 306                   }                                                           \
 307                 else if (inptr[2] == '(')                                     \
 308                   {                                                           \
 309                     if (inptr[3] == 'C')                                      \
 310                       {                                                       \
 311                         /* KSC 5601-1987 selected.  */                        \
 312                         set = KSC5601_set;                                    \
 313                         inptr += 4;                                           \
 314                         continue;                                             \
 315                       }                                                       \
 316                     else if (inptr[3] == 'D')                                 \
 317                       {                                                       \
 318                         /* JIS X 0212-1990 selected.  */                      \
 319                         set = JISX0212_set;                                   \
 320                         inptr += 4;                                           \
 321                         continue;                                             \
 322                       }                                                       \
 323                   }                                                           \
 324               }                                                               \
 325           }                                                                   \
 326         else if (var == iso2022jp2 && inptr[1] == '.')                        \
 327           {                                                                   \
 328             if (inptr[2] == 'A')                                              \
 329               {                                                               \
 330                 /* ISO 8859-1-GR selected.  */                                \
 331                 set2 = ISO88591_set;                                          \
 332                 inptr += 3;                                                   \
 333                 continue;                                                     \
 334               }                                                               \
 335             else if (inptr[2] == 'F')                                         \
 336               {                                                               \
 337                 /* ISO 8859-7-GR selected.  */                                \
 338                 set2 = ISO88597_set;                                          \
 339                 inptr += 3;                                                   \
 340                 continue;                                                     \
 341               }                                                               \
 342           }                                                                   \
 343       }                                                                       \
 344                                                                               \
 345     if (ch == ESC && var == iso2022jp2 && inptr[1] == 'N')                    \
 346       {                                                                       \
 347         if (set2 == ISO88591_set)                                             \
 348           {                                                                   \
 349             ch = inptr[2] | 0x80;                                             \
 350             inptr += 3;                                                       \
 351           }                                                                   \
 352         else if (set2 == ISO88597_set)                                        \
 353           {                                                                   \
 354             /* We use the table from the ISO 8859-7 module.  */               \
 355             if (inptr[2] < 0x20 || inptr[2] > 0x80)                           \
 356               {                                                               \
 357                 result = GCONV_ILLEGAL_INPUT;                                 \
 358                 break;                                                        \
 359               }                                                               \
 360             ch = iso88597_to_ucs4[inptr[2] - 0x20];                           \
 361             if (ch == 0)                                                      \
 362               {                                                               \
 363                 result = GCONV_ILLEGAL_INPUT;                                 \
 364                 break;                                                        \
 365               }                                                               \
 366             inptr += 3;                                                       \
 367           }                                                                   \
 368         else                                                                  \
 369           {                                                                   \
 370             result = GCONV_ILLEGAL_INPUT;                                     \
 371             break;                                                            \
 372           }                                                                   \
 373       }                                                                       \
 374     else if (set == ASCII_set || (ch < 0x21 || ch == 0x7f))                   \
 375       /* Almost done, just advance the input pointer.  */                     \
 376       ++inptr;                                                                \
 377     else if (set == JISX0201_Roman_set)                                       \
 378       {                                                                       \
 379         /* Use the JIS X 0201 table.  */                                      \
 380         ch = jisx0201_to_ucs4 (ch);                                           \
 381         if (ch == UNKNOWN_10646_CHAR)                                         \
 382           {                                                                   \
 383             result = GCONV_ILLEGAL_INPUT;                                     \
 384             break;                                                            \
 385           }                                                                   \
 386         ++inptr;                                                              \
 387       }                                                                       \
 388     else if (set == JISX0201_Kana_set)                                        \
 389       {                                                                       \
 390         /* Use the JIS X 0201 table.  */                                      \
 391         ch = jisx0201_to_ucs4 (ch + 0x80);                                    \
 392         if (ch == UNKNOWN_10646_CHAR)                                         \
 393           {                                                                   \
 394             result = GCONV_ILLEGAL_INPUT;                                     \
 395             break;                                                            \
 396           }                                                                   \
 397         ++inptr;                                                              \
 398       }                                                                       \
 399     else                                                                      \
 400       {                                                                       \
 401         if (set == JISX0208_1978_set || set == JISX0208_1983_set)             \
 402           /* XXX I don't have the tables for these two old variants of        \
 403              JIS X 0208.  Therefore I'm using the tables for JIS X            \
 404              0208-1990.  If somebody has problems with this please            \
 405              provide the appropriate tables.  */                              \
 406           ch = jisx0208_to_ucs4 (&inptr,                                      \
 407                                  NEED_LENGTH_TEST ? inend - inptr : 2, 0);    \
 408         else if (set == JISX0212_set)                                         \
 409           /* Use the JIS X 0212 table.  */                                    \
 410           ch = jisx0212_to_ucs4 (&inptr,                                      \
 411                                  NEED_LENGTH_TEST ? inend - inptr : 2, 0);    \
 412         else if (set == GB2312_set)                                           \
 413           /* Use the GB 2312 table.  */                                       \
 414           ch = gb2312_to_ucs4 (&inptr,                                        \
 415                                NEED_LENGTH_TEST ? inend - inptr : 2, 0);      \
 416         else                                                                  \
 417           {                                                                   \
 418             assert (set == KSC5601_set);                                      \
 419                                                                               \
 420             /* Use the KSC 5601 table.  */                                    \
 421             ch = ksc5601_to_ucs4 (&inptr,                                     \
 422                                   NEED_LENGTH_TEST ? inend - inptr : 2, 0);   \
 423           }                                                                   \
 424                                                                               \
 425         if (NEED_LENGTH_TEST && ch == 0)                                      \
 426           {                                                                   \
 427             result = GCONV_EMPTY_INPUT;                                       \
 428             break;                                                            \
 429           }                                                                   \
 430         else if (ch == UNKNOWN_10646_CHAR)                                    \
 431           {                                                                   \
 432             result = GCONV_ILLEGAL_INPUT;                                     \
 433             break;                                                            \
 434           }                                                                   \
 435       }                                                                       \
 436                                                                               \
 437     *((uint32_t *) outptr)++ = ch;                                            \
 438   }
 439 #define EXTRA_LOOP_DECLS        , enum variant var, int *setp
 440 #define INIT_PARAMS             int set = *setp % 0x100, set2 = *setp / 0x100
 441 #define UPDATE_PARAMS           *setp = (set2 << 8) + set
 442 #include <iconv/loop.c>
 443
 444
 445 /* Next, define the other direction.  */
 446 #define MIN_NEEDED_INPUT        MIN_NEEDED_TO
 447 #define MIN_NEEDED_OUTPUT       MIN_NEEDED_FROM
 448 #define MAX_NEEDED_OUTPUT       (MAX_NEEDED_FROM + 2)
 449 #define LOOPFCT                 TO_LOOP
 450 #define BODY \
 451   {                                                                           \
 452     uint32_t ch;                                                              \
 453     size_t written = 0;                                                       \
 454                                                                               \
 455     ch = *((uint32_t *) inptr);                                               \
 456                                                                               \
 457     /* First see whether we can write the character using the currently       \
 458        selected character set.  */                                            \
 459     if (set == ASCII_set)                                                     \
 460       {                                                                       \
 461         /* Please note that the NUL byte is *not* matched if we are not       \
 462            currently using the ASCII charset.  This is because we must        \
 463            switch to the initial state whenever a NUL byte is written.  */    \
 464         if (ch <= 0x7f)                                                       \
 465           {                                                                   \
 466             *outptr++ = ch;                                                   \
 467             written = 1;                                                      \
 468           }                                                                   \
 469         /* At the beginning of a line, G2 designation is cleared.  */         \
 470         if (var == iso2022jp2 && ch == 0x0a)                                  \
 471           set2 = UNSPECIFIED_set;                                             \
 472       }                                                                       \
 473     else if (set == JISX0201_Roman_set)                                       \
 474       {                                                                       \
 475         unsigned char buf[2];                                                 \
 476         written = ucs4_to_jisx0201 (ch, buf);                                 \
 477         if (written != UNKNOWN_10646_CHAR && buf[0] > 0x20 && buf[0] < 0x80)  \
 478           {                                                                   \
 479             *outptr++ = buf[0];                                               \
 480             written = 1;                                                      \
 481           }                                                                   \
 482         else                                                                  \
 483           written = UNKNOWN_10646_CHAR;                                       \
 484       }                                                                       \
 485     else if (set == JISX0201_Kana_set)                                        \
 486       {                                                                       \
 487         unsigned char buf[2];                                                 \
 488         written = ucs4_to_jisx0201 (ch, buf);                                 \
 489         if (written != UNKNOWN_10646_CHAR && buf[0] > 0xa0 && buf[0] < 0xe0)  \
 490           {                                                                   \
 491             *outptr++ = buf[0] - 0x80;                                        \
 492             written = 1;                                                      \
 493           }                                                                   \
 494         else                                                                  \
 495           written = UNKNOWN_10646_CHAR;                                       \
 496       }                                                                       \
 497     else                                                                      \
 498       {                                                                       \
 499         if (set == JISX0208_1978_set || set == JISX0208_1983_set)             \
 500           written = ucs4_to_jisx0208 (ch, outptr,                             \
 501                                       (NEED_LENGTH_TEST                       \
 502                                        ? outend - outptr : 2));               \
 503         else if (set == JISX0212_set)                                         \
 504           written = ucs4_to_jisx0212 (ch, outptr,                             \
 505                                       (NEED_LENGTH_TEST                       \
 506                                        ? outend - outptr : 2));               \
 507         else if (set == GB2312_set)                                           \
 508           written = ucs4_to_gb2312 (ch, outptr, (NEED_LENGTH_TEST             \
 509                                                  ? outend - outptr : 2));     \
 510         else                                                                  \
 511           {                                                                   \
 512             assert (set == KSC5601_set);                                      \
 513                                                                               \
 514             written = ucs4_to_ksc5601 (ch, outptr,                            \
 515                                        (NEED_LENGTH_TEST                      \
 516                                         ? outend - outptr : 2));              \
 517           }                                                                   \
 518                                                                               \
 519         if (NEED_LENGTH_TEST && written == 0)                                 \
 520           {                                                                   \
 521             result = GCONV_FULL_OUTPUT;                                       \
 522             break;                                                            \
 523           }                                                                   \
 524         else if (written != UNKNOWN_10646_CHAR)                               \
 525           outptr += written;                                                  \
 526       }                                                                       \
 527                                                                               \
 528     if (written == UNKNOWN_10646_CHAR || written == 0)                        \
 529       {                                                                       \
 530         if (set2 == ISO88591_set)                                             \
 531           {                                                                   \
 532             if (ch >= 0x80 && ch <= 0xff)                                     \
 533               {                                                               \
 534                 *outptr++ = ESC;                                              \
 535                 *outptr++ = 'N';                                              \
 536                 *outptr++ = ch & 0x7f;                                        \
 537                 written = 3;                                                  \
 538               }                                                               \
 539           }                                                                   \
 540         else if (set2 == ISO88597_set)                                        \
 541           {                                                                   \
 542             const struct gap *rp = from_idx;                                  \
 543                                                                               \
 544             while (ch > rp->end)                                              \
 545               ++rp;                                                           \
 546             if (ch >= rp->start)                                              \
 547               {                                                               \
 548                 unsigned char res = iso88597_from_ucs4[ch - 0xa0 + rp->idx];  \
 549                 if (res != '\0')                                              \
 550                   {                                                           \
 551                     *outptr++ = ESC;                                          \
 552                     *outptr++ = 'N';                                          \
 553                     *outptr++ = res;                                          \
 554                     written = 3;                                              \
 555                   }                                                           \
 556               }                                                               \
 557           }                                                                   \
 558       }                                                                       \
 559                                                                               \
 560     if (written == UNKNOWN_10646_CHAR || written == 0)                        \
 561       {                                                                       \
 562         /* Either this is an unknown character or we have to switch           \
 563            the currently selected character set.  The character sets          \
 564            do not code entirely separate parts of ISO 10646 and               \
 565            therefore there is no single correct result.  If we choose         \
 566            the wrong character set we might end up using yet another          \
 567            character set for the next character even though the               \
 568            current and the next could be encoded with one character           \
 569            set.  We leave this kind of optimization for later and for         \
 570            now simply use a fixed order in which we test for                  \
 571            availability.  */                                                  \
 572                                                                               \
 573         if (ch <= 0x7f)                                                       \
 574           {                                                                   \
 575             /* We must encode using ASCII.  First write out the               \
 576                escape sequence.  */                                           \
 577             if (NEED_LENGTH_TEST && outptr + 4 > outend)                      \
 578               {                                                               \
 579                 result = GCONV_FULL_OUTPUT;                                   \
 580                 break;                                                        \
 581               }                                                               \
 582                                                                               \
 583             *outptr++ = ESC;                                                  \
 584             *outptr++ = '(';                                                  \
 585             *outptr++ = 'B';                                                  \
 586             set = ASCII_set;                                                  \
 587             *outptr++ = ch;                                                   \
 588                                                                               \
 589             /* At the beginning of a line, G2 designation is cleared.  */     \
 590             if (var == iso2022jp2 && ch == 0x0a)                              \
 591               set2 = UNSPECIFIED_set;                                         \
 592           }                                                                   \
 593         else                                                                  \
 594           {                                                                   \
 595             /* Now it becomes difficult.  We must search the other            \
 596                character sets one by one and we cannot use simple             \
 597                arithmetic to determine whether the character can be           \
 598                encoded using this set.  */                                    \
 599             size_t written;                                                   \
 600             unsigned char buf[2];                                             \
 601                                                                               \
 602             written = ucs4_to_jisx0201 (ch, buf);                             \
 603             if (written != UNKNOWN_10646_CHAR && buf[0] < 0x80)               \
 604               {                                                               \
 605                 /* We use JIS X 0201.  */                                     \
 606                 if (NEED_LENGTH_TEST && outptr + 4 > outend)                  \
 607                   {                                                           \
 608                     result = GCONV_FULL_OUTPUT;                               \
 609                     break;                                                    \
 610                   }                                                           \
 611                                                                               \
 612                 *outptr++ = ESC;                                              \
 613                 *outptr++ = '(';                                              \
 614                 *outptr++ = 'J';                                              \
 615                 set = JISX0201_Roman_set;                                     \
 616                 *outptr++ = buf[0];                                           \
 617               }                                                               \
 618             else                                                              \
 619               {                                                               \
 620                 written = ucs4_to_jisx0208 (ch, buf, 2);                      \
 621                 if (written != UNKNOWN_10646_CHAR)                            \
 622                   {                                                           \
 623                     /* We use JIS X 0208.  */                                 \
 624                     if (NEED_LENGTH_TEST && outptr + 5 > outend)              \
 625                       {                                                       \
 626                         result = GCONV_FULL_OUTPUT;                           \
 627                         break;                                                \
 628                       }                                                       \
 629                                                                               \
 630                     *outptr++ = ESC;                                          \
 631                     *outptr++ = '$';                                          \
 632                     *outptr++ = 'B';                                          \
 633                     set = JISX0208_1983_set;                                  \
 634                     *outptr++ = buf[0];                                       \
 635                     *outptr++ = buf[1];                                       \
 636                   }                                                           \
 637                 else if (var == iso2022jp)                                    \
 638                   {                                                           \
 639                     /* We have no other choice.  */                           \
 640                     result = GCONV_ILLEGAL_INPUT;                             \
 641                     break;                                                    \
 642                   }                                                           \
 643                 else                                                          \
 644                   {                                                           \
 645                     written = ucs4_to_jisx0212 (ch, buf, 2);                  \
 646                     if (written != UNKNOWN_10646_CHAR)                        \
 647                       {                                                       \
 648                         /* We use JIS X 0212.  */                             \
 649                         if (NEED_LENGTH_TEST && outptr + 6 > outend)          \
 650                           {                                                   \
 651                             result = GCONV_FULL_OUTPUT;                       \
 652                             break;                                            \
 653                           }                                                   \
 654                         *outptr++ = ESC;                                      \
 655                         *outptr++ = '$';                                      \
 656                         *outptr++ = '(';                                      \
 657                         *outptr++ = 'D';                                      \
 658                         set = JISX0212_set;                                   \
 659                         *outptr++ = buf[0];                                   \
 660                         *outptr++ = buf[1];                                   \
 661                       }                                                       \
 662                     else                                                      \
 663                       {                                                       \
 664                         written = ucs4_to_jisx0201 (ch, buf);                 \
 665                         if (written != UNKNOWN_10646_CHAR && buf[0] >= 0x80)  \
 666                           {                                                   \
 667                             /* We use JIS X 0201.  */                         \
 668                             if (NEED_LENGTH_TEST && outptr + 4 > outend)      \
 669                               {                                               \
 670                                 result = GCONV_FULL_OUTPUT;                   \
 671                                 break;                                        \
 672                               }                                               \
 673                                                                               \
 674                             *outptr++ = ESC;                                  \
 675                             *outptr++ = '(';                                  \
 676                             *outptr++ = 'I';                                  \
 677                             set = JISX0201_Kana_set;                          \
 678                             *outptr++ = buf[0] - 0x80;                        \
 679                           }                                                   \
 680                         else if (ch != 0xa5 && ch >= 0x80 && ch <= 0xff)      \
 681                           {                                                   \
 682                             /* ISO 8859-1 upper half.   */                    \
 683                             if (NEED_LENGTH_TEST && outptr + 6 > outend)      \
 684                               {                                               \
 685                                 result = GCONV_FULL_OUTPUT;                   \
 686                                 break;                                        \
 687                               }                                               \
 688                                                                               \
 689                             *outptr++ = ESC;                                  \
 690                             *outptr++ = '.';                                  \
 691                             *outptr++ = 'A';                                  \
 692                             set2 = ISO88591_set;                              \
 693                             *outptr++ = ESC;                                  \
 694                             *outptr++ = 'N';                                  \
 695                             *outptr++ = ch;                                   \
 696                           }                                                   \
 697                         else                                                  \
 698                           {                                                   \
 699                             written = ucs4_to_gb2312 (ch, buf, 2);            \
 700                             if (written != UNKNOWN_10646_CHAR)                \
 701                               {                                               \
 702                                 /* We use GB 2312.  */                        \
 703                                 if (NEED_LENGTH_TEST && outptr + 5 > outend)  \
 704                                   {                                           \
 705                                     result = GCONV_FULL_OUTPUT;               \
 706                                     break;                                    \
 707                                   }                                           \
 708                                                                               \
 709                                 *outptr++ = ESC;                              \
 710                                 *outptr++ = '$';                              \
 711                                 *outptr++ = 'A';                              \
 712                                 set = GB2312_set;                             \
 713                                 *outptr++ = buf[0];                           \
 714                                 *outptr++ = buf[1];                           \
 715                               }                                               \
 716                             else                                              \
 717                               {                                               \
 718                                 written = ucs4_to_ksc5601 (ch, buf, 2);       \
 719                                 if (written != UNKNOWN_10646_CHAR)            \
 720                                   {                                           \
 721                                     /* We use KSC 5601.  */                   \
 722                                     if (NEED_LENGTH_TEST                      \
 723                                         && outptr + 6 > outend)               \
 724                                       {                                       \
 725                                         result = GCONV_FULL_OUTPUT;           \
 726                                         break;                                \
 727                                       }                                       \
 728                                     *outptr++ = ESC;                          \
 729                                     *outptr++ = '$';                          \
 730                                     *outptr++ = '(';                          \
 731                                     *outptr++ = 'C';                          \
 732                                     set = KSC5601_set;                        \
 733                                     *outptr++ = buf[0];                       \
 734                                     *outptr++ = buf[1];                       \
 735                                   }                                           \
 736                                 else                                          \
 737                                   {                                           \
 738                                     const struct gap *rp = from_idx;          \
 739                                     unsigned char gch = 0;                    \
 740                                                                               \
 741                                     while (ch > rp->end)                      \
 742                                       ++rp;                                   \
 743                                     if (ch >= rp->start)                      \
 744                                       {                                       \
 745                                         ch = ch - 0xa0 + rp->idx;             \
 746                                         gch = iso88597_from_ucs4[ch];         \
 747                                       }                                       \
 748                                                                               \
 749                                     if (gch != 0)                             \
 750                                       {                                       \
 751                                         /* We use ISO 8859-7 greek.  */       \
 752                                         if (NEED_LENGTH_TEST                  \
 753                                             && outptr + 6 > outend)           \
 754                                           {                                   \
 755                                             result = GCONV_FULL_OUTPUT;       \
 756                                             break;                            \
 757                                           }                                   \
 758                                         *outptr++ = ESC;                      \
 759                                         *outptr++ = '.';                      \
 760                                         *outptr++ = 'F';                      \
 761                                         set2 = ISO88597_set;                  \
 762                                         *outptr++ = ESC;                      \
 763                                         *outptr++ = 'N';                      \
 764                                         *outptr++ = gch;                      \
 765                                       }                                       \
 766                                     else                                      \
 767                                       {                                       \
 768                                         result = GCONV_ILLEGAL_INPUT;         \
 769                                         break;                                \
 770                                       }                                       \
 771                                   }                                           \
 772                               }                                               \
 773                           }                                                   \
 774                       }                                                       \
 775                   }                                                           \
 776               }                                                               \
 777           }                                                                   \
 778       }                                                                       \
 779                                                                               \
 780     /* Now that we wrote the output increment the input pointer.  */          \
 781     inptr += 4;                                                               \
 782   }
 783 #define EXTRA_LOOP_DECLS        , enum variant var, int *setp
     /* These three macros parameterize the <iconv/loop.c> template that is
        included right after them.  EXTRA_LOOP_DECLS names `var' (the value
        the conversion body compares against iso2022jp and iso2022jp2) and
        `setp' (pointer to the int holding the packed designation state).
        INIT_PARAMS unpacks *SETP into two locals: `set' is the value
        modulo 0x100 and `set2' (the G2 designation used by the body) is
        the quotient by 0x100.  UPDATE_PARAMS stores both back as
        (set2 << 8) + set.
        NOTE(review): where exactly loop.c expands these macros is not
        visible from this file -- confirm against iconv/loop.c.  */
 784 #define INIT_PARAMS             int set = *setp % 0x100, set2 = *setp / 0x100
 785 #define UPDATE_PARAMS           *setp = (set2 << 8) + set
 786 #include <iconv/loop.c>
 787
 788
 789 /* Now define the toplevel functions.  */
 790 #include <iconv/skeleton.c>