Back to index

php5  5.3.10
Defines | Functions | Variables
mbfilter_jis.c File Reference
#include "mbfilter.h"
#include "mbfilter_jis.h"
#include "unicode_table_cp932_ext.h"
#include "unicode_table_jis.h"

Go to the source code of this file.

Defines

#define CK(statement)   do { if ((statement) < 0) return (-1); } while (0)

Functions

static int mbfl_filt_ident_jis (int c, mbfl_identify_filter *filter)
static int mbfl_filt_ident_2022jp (int c, mbfl_identify_filter *filter)
int mbfl_filt_conv_jis_wchar (int c, mbfl_convert_filter *filter)
int mbfl_filt_conv_wchar_jis (int c, mbfl_convert_filter *filter)
int mbfl_filt_conv_wchar_2022jp (int c, mbfl_convert_filter *filter)
int mbfl_filt_conv_any_jis_flush (mbfl_convert_filter *filter)

Variables

const mbfl_encoding mbfl_encoding_jis
const mbfl_encoding mbfl_encoding_2022jp

Define Documentation

#define CK (   statement)    do { if ((statement) < 0) return (-1); } while (0)

Definition at line 111 of file mbfilter_jis.c.


Function Documentation

int mbfl_filt_conv_any_jis_flush ( mbfl_convert_filter *  filter)

Definition at line 472 of file mbfilter_jis.c.

{
       /* back to latin */
       if ((filter->status & 0xff00) != 0) {
              CK((*filter->output_function)(0x1b, filter->data));            /* ESC */
              CK((*filter->output_function)(0x28, filter->data));            /* '(' */
              CK((*filter->output_function)(0x42, filter->data));            /* 'B' */
       }
       filter->status &= 0xff;

       if (filter->flush_function != NULL) {
              return (*filter->flush_function)(filter->data);
       }

       return 0;
}
int mbfl_filt_conv_jis_wchar ( int  c,
mbfl_convert_filter *  filter 
)

Definition at line 117 of file mbfilter_jis.c.

{
       int c1, s, w;

retry:
       switch (filter->status & 0xf) {
/*     case 0x00:     ASCII */
/*     case 0x10:     X 0201 latin */
/*     case 0x20:     X 0201 kana */
/*     case 0x80:     X 0208 */
/*     case 0x90:     X 0212 */
       case 0:
              if (c == 0x1b) {
                     filter->status += 2;
              } else if (c == 0x0e) {            /* "kana in" */
                     filter->status = 0x20;
              } else if (c == 0x0f) {            /* "kana out" */
                     filter->status = 0;
              } else if (filter->status == 0x10 && c == 0x5c) {       /* YEN SIGN */
                     CK((*filter->output_function)(0xa5, filter->data));
              } else if (filter->status == 0x10 && c == 0x7e) {       /* OVER LINE */
                     CK((*filter->output_function)(0x203e, filter->data));
              } else if (filter->status == 0x20 && c > 0x20 && c < 0x60) {          /* kana */
                     CK((*filter->output_function)(0xff40 + c, filter->data));
              } else if ((filter->status == 0x80 || filter->status == 0x90) && c > 0x20 && c < 0x7f) {          /* kanji first char */
                     filter->cache = c;
                     filter->status += 1;
              } else if (c >= 0 && c < 0x80) {          /* latin, CTLs */
                     CK((*filter->output_function)(c, filter->data));
              } else if (c > 0xa0 && c < 0xe0) { /* GR kana */
                     CK((*filter->output_function)(0xfec0 + c, filter->data));
              } else {
                     w = c & MBFL_WCSGROUP_MASK;
                     w |= MBFL_WCSGROUP_THROUGH;
                     CK((*filter->output_function)(w, filter->data));
              }
              break;

/*     case 0x81:     X 0208 second char */
/*     case 0x91:     X 0212 second char */
       case 1:
              filter->status &= ~0xf;
              c1 = filter->cache;
              if (c > 0x20 && c < 0x7f) {
                     s = (c1 - 0x21)*94 + c - 0x21;
                     if (filter->status == 0x80) {
                            if (s >= 0 && s < jisx0208_ucs_table_size) {
                                   w = jisx0208_ucs_table[s];
                            } else {
                                   w = 0;
                            }
                            if (w <= 0) {
                                   w = (c1 << 8) | c;
                                   w &= MBFL_WCSPLANE_MASK;
                                   w |= MBFL_WCSPLANE_JIS0208;
                            }
                     } else {
                            if (s >= 0 && s < jisx0212_ucs_table_size) {
                                   w = jisx0212_ucs_table[s];
                            } else {
                                   w = 0;
                            }
                            if (w <= 0) {
                                   w = (c1 << 8) | c;
                                   w &= MBFL_WCSPLANE_MASK;
                                   w |= MBFL_WCSPLANE_JIS0212;
                            }
                     }
                     CK((*filter->output_function)(w, filter->data));
              } else if (c == 0x1b) {
                     filter->status += 2;
              } else if ((c >= 0 && c < 0x21) || c == 0x7f) {         /* CTLs */
                     CK((*filter->output_function)(c, filter->data));
              } else {
                     w = (c1 << 8) | c;
                     w &= MBFL_WCSGROUP_MASK;
                     w |= MBFL_WCSGROUP_THROUGH;
                     CK((*filter->output_function)(w, filter->data));
              }
              break;

       /* ESC */
/*     case 0x02:    */
/*     case 0x12:    */
/*     case 0x22:    */
/*     case 0x82:    */
/*     case 0x92:    */
       case 2:
              if (c == 0x24) {            /* '$' */
                     filter->status++;
              } else if (c == 0x28) {            /* '(' */
                     filter->status += 3;
              } else {
                     filter->status &= ~0xf;
                     CK((*filter->output_function)(0x1b, filter->data));
                     goto retry;
              }
              break;

       /* ESC $ */
/*     case 0x03:    */
/*     case 0x13:    */
/*     case 0x23:    */
/*     case 0x83:    */
/*     case 0x93:    */
       case 3:
              if (c == 0x40 || c == 0x42) {      /* '@' or 'B' */
                     filter->status = 0x80;
              } else if (c == 0x28) {                   /* '(' */
                     filter->status++;
              } else {
                     filter->status &= ~0xf;
                     CK((*filter->output_function)(0x1b, filter->data));
                     CK((*filter->output_function)(0x24, filter->data));
                     goto retry;
              }
              break;

       /* ESC $ ( */
/*     case 0x04:    */
/*     case 0x14:    */
/*     case 0x24:    */
/*     case 0x84:    */
/*     case 0x94:    */
       case 4:
              if (c == 0x40 || c == 0x42) {      /* '@' or 'B' */
                     filter->status = 0x80;
              } else if (c == 0x44) {                   /* 'D' */
                     filter->status = 0x90;
              } else {
                     filter->status &= ~0xf;
                     CK((*filter->output_function)(0x1b, filter->data));
                     CK((*filter->output_function)(0x24, filter->data));
                     CK((*filter->output_function)(0x28, filter->data));
                     goto retry;
              }
              break;

       /* ESC ( */
/*     case 0x05:    */
/*     case 0x15:    */
/*     case 0x25:    */
/*     case 0x85:    */
/*     case 0x95:    */
       case 5:
              if (c == 0x42 || c == 0x48) {             /* 'B' or 'H' */
                     filter->status = 0;
              } else if (c == 0x4a) {            /* 'J' */
                     filter->status = 0x10;
              } else if (c == 0x49) {            /* 'I' */
                     filter->status = 0x20;
              } else {
                     filter->status &= ~0xf;
                     CK((*filter->output_function)(0x1b, filter->data));
                     CK((*filter->output_function)(0x28, filter->data));
                     goto retry;
              }
              break;

       default:
              filter->status = 0;
              break;
       }

       return c;
}
int mbfl_filt_conv_wchar_2022jp ( int  c,
mbfl_convert_filter *  filter 
)

Definition at line 393 of file mbfilter_jis.c.

{
       int s;

       s = 0;
       if (c >= ucs_a1_jis_table_min && c < ucs_a1_jis_table_max) {
              s = ucs_a1_jis_table[c - ucs_a1_jis_table_min];
       } else if (c >= ucs_a2_jis_table_min && c < ucs_a2_jis_table_max) {
              s = ucs_a2_jis_table[c - ucs_a2_jis_table_min];
       } else if (c >= ucs_i_jis_table_min && c < ucs_i_jis_table_max) {
              s = ucs_i_jis_table[c - ucs_i_jis_table_min];
       } else if (c >= ucs_r_jis_table_min && c < ucs_r_jis_table_max) {
              s = ucs_r_jis_table[c - ucs_r_jis_table_min];
       }
       if (s <= 0) {
              if (c == 0xa5) {                   /* YEN SIGN */
                     s = 0x1005c;
              } else if (c == 0x203e) {   /* OVER LINE */
                     s = 0x1007e;
              } else if (c == 0xff3c) {   /* FULLWIDTH REVERSE SOLIDUS */
                     s = 0x2140;
              } else if (c == 0xff5e) {   /* FULLWIDTH TILDE */
                     s = 0x2141;
              } else if (c == 0x2225) {   /* PARALLEL TO */
                     s = 0x2142;
              } else if (c == 0xff0d) {   /* FULLWIDTH HYPHEN-MINUS */
                     s = 0x215d;
              } else if (c == 0xffe0) {   /* FULLWIDTH CENT SIGN */
                     s = 0x2171;
              } else if (c == 0xffe1) {   /* FULLWIDTH POUND SIGN */
                     s = 0x2172;
              } else if (c == 0xffe2) {   /* FULLWIDTH NOT SIGN */
                     s = 0x224c;
              }
              if (c == 0) {
                     s = 0;
              } else if (s <= 0) {
                     s = -1;
              }
       } else if ((s >= 0x80 && s < 0x2121) || (s > 0x8080)) {
              s = -1;
       }
       if (s >= 0) {
              if (s < 0x80) { /* ASCII */
                     if ((filter->status & 0xff00) != 0) {
                            CK((*filter->output_function)(0x1b, filter->data));            /* ESC */
                            CK((*filter->output_function)(0x28, filter->data));            /* '(' */
                            CK((*filter->output_function)(0x42, filter->data));            /* 'B' */
                     }
                     filter->status = 0;
                     CK((*filter->output_function)(s, filter->data));
              } else if (s < 0x10000) { /* X 0208 */
                     if ((filter->status & 0xff00) != 0x200) {
                            CK((*filter->output_function)(0x1b, filter->data));            /* ESC */
                            CK((*filter->output_function)(0x24, filter->data));            /* '$' */
                            CK((*filter->output_function)(0x42, filter->data));            /* 'B' */
                     }
                     filter->status = 0x200;
                     CK((*filter->output_function)((s >> 8) & 0x7f, filter->data));
                     CK((*filter->output_function)(s & 0x7f, filter->data));
              } else { /* X 0201 latin */
                     if ((filter->status & 0xff00) != 0x400) {
                            CK((*filter->output_function)(0x1b, filter->data));            /* ESC */
                            CK((*filter->output_function)(0x28, filter->data));            /* '(' */
                            CK((*filter->output_function)(0x4a, filter->data));            /* 'J' */
                     }
                     filter->status = 0x400;
                     CK((*filter->output_function)(s & 0x7f, filter->data));
              }
       } else {
              if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
                     CK(mbfl_filt_conv_illegal_output(c, filter));
              }
       }

       return c;
}

Here is the call graph for this function:

int mbfl_filt_conv_wchar_jis ( int  c,
mbfl_convert_filter *  filter 
)

Definition at line 288 of file mbfilter_jis.c.

{
       int c1, s;

       s = 0;
       if (c >= ucs_a1_jis_table_min && c < ucs_a1_jis_table_max) {
              s = ucs_a1_jis_table[c - ucs_a1_jis_table_min];
       } else if (c >= ucs_a2_jis_table_min && c < ucs_a2_jis_table_max) {
              s = ucs_a2_jis_table[c - ucs_a2_jis_table_min];
       } else if (c >= ucs_i_jis_table_min && c < ucs_i_jis_table_max) {
              s = ucs_i_jis_table[c - ucs_i_jis_table_min];
       } else if (c >= ucs_r_jis_table_min && c < ucs_r_jis_table_max) {
              s = ucs_r_jis_table[c - ucs_r_jis_table_min];
       }
       if (s <= 0) {
              c1 = c & ~MBFL_WCSPLANE_MASK;
              if (c1 == MBFL_WCSPLANE_JIS0208) {
                     s = c & MBFL_WCSPLANE_MASK;
              } else if (c1 == MBFL_WCSPLANE_JIS0212) {
                     s = c & MBFL_WCSPLANE_MASK;
                     s |= 0x8080;
              } else if (c == 0xa5) {            /* YEN SIGN */
                     s = 0x1005c;
              } else if (c == 0x203e) {   /* OVER LINE */
                     s = 0x1007e;
              } else if (c == 0xff3c) {   /* FULLWIDTH REVERSE SOLIDUS */
                     s = 0x2140;
              } else if (c == 0xff5e) {   /* FULLWIDTH TILDE */
                     s = 0x2141;
              } else if (c == 0x2225) {   /* PARALLEL TO */
                     s = 0x2142;
              } else if (c == 0xff0d) {   /* FULLWIDTH HYPHEN-MINUS */
                     s = 0x215d;
              } else if (c == 0xffe0) {   /* FULLWIDTH CENT SIGN */
                     s = 0x2171;
              } else if (c == 0xffe1) {   /* FULLWIDTH POUND SIGN */
                     s = 0x2172;
              } else if (c == 0xffe2) {   /* FULLWIDTH NOT SIGN */
                     s = 0x224c;
              }
              if (c == 0) {
                     s = 0;
              } else if (s <= 0) {
                     s = -1;
              }
       }
       if (s >= 0) {
              if (s < 0x80) { /* ASCII */
                     if ((filter->status & 0xff00) != 0) {
                            CK((*filter->output_function)(0x1b, filter->data));            /* ESC */
                            CK((*filter->output_function)(0x28, filter->data));            /* '(' */
                            CK((*filter->output_function)(0x42, filter->data));            /* 'B' */
                     }
                     filter->status = 0;
                     CK((*filter->output_function)(s, filter->data));
              } else if (s < 0x100) { /* kana */
                     if ((filter->status & 0xff00) != 0x100) {
                            CK((*filter->output_function)(0x1b, filter->data));            /* ESC */
                            CK((*filter->output_function)(0x28, filter->data));            /* '(' */
                            CK((*filter->output_function)(0x49, filter->data));            /* 'I' */
                     }
                     filter->status = 0x100;
                     CK((*filter->output_function)(s & 0x7f, filter->data));
              } else if (s < 0x8080) { /* X 0208 */
                     if ((filter->status & 0xff00) != 0x200) {
                            CK((*filter->output_function)(0x1b, filter->data));            /* ESC */
                            CK((*filter->output_function)(0x24, filter->data));            /* '$' */
                            CK((*filter->output_function)(0x42, filter->data));            /* 'B' */
                     }
                     filter->status = 0x200;
                     CK((*filter->output_function)((s >> 8) & 0x7f, filter->data));
                     CK((*filter->output_function)(s & 0x7f, filter->data));
              } else if (s < 0x10000) { /* X 0212 */
                     if ((filter->status & 0xff00) != 0x300) {
                            CK((*filter->output_function)(0x1b, filter->data));            /* ESC */
                            CK((*filter->output_function)(0x24, filter->data));            /* '$' */
                            CK((*filter->output_function)(0x28, filter->data));            /* '(' */
                            CK((*filter->output_function)(0x44, filter->data));            /* 'D' */
                     }
                     filter->status = 0x300;
                     CK((*filter->output_function)((s >> 8) & 0x7f, filter->data));
                     CK((*filter->output_function)(s & 0x7f, filter->data));
              } else { /* X 0201 latin */
                     if ((filter->status & 0xff00) != 0x400) {
                            CK((*filter->output_function)(0x1b, filter->data));            /* ESC */
                            CK((*filter->output_function)(0x28, filter->data));            /* '(' */
                            CK((*filter->output_function)(0x4a, filter->data));            /* 'J' */
                     }
                     filter->status = 0x400;
                     CK((*filter->output_function)(s & 0x7f, filter->data));
              }
       } else {
              if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
                     CK(mbfl_filt_conv_illegal_output(c, filter));
              }
       }

       return c;
}

Here is the call graph for this function:

static int mbfl_filt_ident_2022jp ( int  c,
mbfl_identify_filter *  filter 
) [static]

Definition at line 587 of file mbfilter_jis.c.

{
retry:
       switch (filter->status & 0xf) {
/*     case 0x00:     ASCII */
/*     case 0x10:     X 0201 latin */
/*     case 0x80:     X 0208 */
       case 0:
              if (c == 0x1b) {
                     filter->status += 2;
              } else if (filter->status == 0x80 && c > 0x20 && c < 0x7f) {          /* kanji first char */
                     filter->status += 1;
              } else if (c >= 0 && c < 0x80) {          /* latin, CTLs */
                     ;
              } else {
                     filter->flag = 1;    /* bad */
              }
              break;

/*     case 0x81:     X 0208 second char */
       case 1:
              if (c == 0x1b) {
                     filter->status++;
              } else {
                     filter->status &= ~0xf;
                     if (c < 0x21 || c > 0x7e) {        /* bad */
                            filter->flag = 1;
                     }
              }
              break;

       /* ESC */
       case 2:
              if (c == 0x24) {            /* '$' */
                     filter->status++;
              } else if (c == 0x28) {            /* '(' */
                     filter->status += 3;
              } else {
                     filter->flag = 1;    /* bad */
                     filter->status &= ~0xf;
                     goto retry;
              }
              break;

       /* ESC $ */
       case 3:
              if (c == 0x40 || c == 0x42) {             /* '@' or 'B' */
                     filter->status = 0x80;
              } else {
                     filter->flag = 1;    /* bad */
                     filter->status &= ~0xf;
                     goto retry;
              }
              break;

       /* ESC ( */
       case 5:
              if (c == 0x42) {            /* 'B' */
                     filter->status = 0;
              } else if (c == 0x4a) {            /* 'J' */
                     filter->status = 0x10;
              } else {
                     filter->flag = 1;    /* bad */
                     filter->status &= ~0xf;
                     goto retry;
              }
              break;

       default:
              filter->status = 0;
              break;
       }

       return c;
}
static int mbfl_filt_ident_jis ( int  c,
mbfl_identify_filter *  filter 
) [static]

Definition at line 489 of file mbfilter_jis.c.

{
retry:
       switch (filter->status & 0xf) {
/*     case 0x00:     ASCII */
/*     case 0x10:     X 0201 latin */
/*     case 0x20:     X 0201 kana */
/*     case 0x80:     X 0208 */
/*     case 0x90:     X 0212 */
       case 0:
              if (c == 0x1b) {
                     filter->status += 2;
              } else if (c == 0x0e) {                   /* "kana in" */
                     filter->status = 0x20;
              } else if (c == 0x0f) {                   /* "kana out" */
                     filter->status = 0;
              } else if ((filter->status == 0x80 || filter->status == 0x90) && c > 0x20 && c < 0x7f) {          /* kanji first char */
                     filter->status += 1;
              } else if (c >= 0 && c < 0x80) {          /* latin, CTLs */
                     ;
              } else {
                     filter->flag = 1;    /* bad */
              }
              break;

/*     case 0x81:     X 0208 second char */
/*     case 0x91:     X 0212 second char */
       case 1:
              filter->status &= ~0xf;
              if (c == 0x1b) {
                     goto retry;
              } else if (c < 0x21 || c > 0x7e) {        /* bad */
                     filter->flag = 1;
              }
              break;

       /* ESC */
       case 2:
              if (c == 0x24) {            /* '$' */
                     filter->status++;
              } else if (c == 0x28) {            /* '(' */
                     filter->status += 3;
              } else {
                     filter->flag = 1;    /* bad */
                     filter->status &= ~0xf;
                     goto retry;
              }
              break;

       /* ESC $ */
       case 3:
              if (c == 0x40 || c == 0x42) {             /* '@' or 'B' */
                     filter->status = 0x80;
              } else if (c == 0x28) {            /* '(' */
                     filter->status++;
              } else {
                     filter->flag = 1;    /* bad */
                     filter->status &= ~0xf;
                     goto retry;
              }
              break;

       /* ESC $ ( */
       case 4:
              if (c == 0x40 || c == 0x42) {             /* '@' or 'B' */
                     filter->status = 0x80;
              } else if (c == 0x44) {            /* 'D' */
                     filter->status = 0x90;
              } else {
                     filter->flag = 1;    /* bad */
                     filter->status &= ~0xf;
                     goto retry;
              }
              break;

       /* ESC ( */
       case 5:
              if (c == 0x42 || c == 0x48) {             /* 'B' or 'H' */
                     filter->status = 0;
              } else if (c == 0x4a) {            /* 'J' */
                     filter->status = 0x10;
              } else if (c == 0x49) {            /* 'I' */
                     filter->status = 0x20;
              } else {
                     filter->flag = 1;    /* bad */
                     filter->status &= ~0xf;
                     goto retry;
              }
              break;

       default:
              filter->status = 0;
              break;
       }

       return c;
}

Variable Documentation

Initial value:

Definition at line 52 of file mbfilter_jis.c.

Initial value:

Definition at line 43 of file mbfilter_jis.c.