Back to index

php5  5.3.10
Defines | Functions | Variables
mbfilter_euc_jp_win.c File Reference
#include "mbfilter.h"
#include "mbfilter_euc_jp_win.h"
#include "unicode_table_cp932_ext.h"
#include "unicode_table_jis.h"
#include "cp932_table.h"

Go to the source code of this file.

Defines

#define CK(statement)   do { if ((statement) < 0) return (-1); } while (0)

Functions

static int mbfl_filt_ident_eucjp_win (int c, mbfl_identify_filter *filter)
int mbfl_filt_conv_eucjpwin_wchar (int c, mbfl_convert_filter *filter)
int mbfl_filt_conv_wchar_eucjpwin (int c, mbfl_convert_filter *filter)

Variables

static const unsigned char mblen_table_eucjp []
static const char * mbfl_encoding_eucjp_win_aliases []
const mbfl_encoding mbfl_encoding_eucjp_win

Define Documentation

#define CK (   statement)    do { if ((statement) < 0) return (-1); } while (0)

Definition at line 100 of file mbfilter_euc_jp_win.c.


Function Documentation

int mbfl_filt_conv_eucjpwin_wchar ( int  c,
mbfl_convert_filter *  filter 
)

Definition at line 106 of file mbfilter_euc_jp_win.c.

{
	/*
	 * One step of the eucJP-win -> wide character state machine.
	 *
	 *   c       next input byte
	 *   filter  conversion state: filter->status selects the state and
	 *           filter->cache keeps a pending byte between calls
	 *
	 * States: 0 = between characters, 1 = first byte of a two-byte
	 * character cached, 2 = 0x8e seen, 3 = 0x8f seen, 4 = 0x8f plus one
	 * cached byte.
	 *
	 * Returns c, or -1 (through CK) as soon as filter->output_function
	 * reports a negative value.
	 */
	int lead, idx, wc, i;
	const int in_gr = (c > 0xa0 && c < 0xff);                 /* 0xa1..0xfe */
	const int is_ctl = ((c >= 0 && c < 0x21) || c == 0x7f);   /* CTLs */

	switch (filter->status) {
	case 0:
		if (c >= 0 && c < 0x80) {
			/* latin: passed through unchanged */
			CK((*filter->output_function)(c, filter->data));
		} else if (in_gr) {
			/* CP932 first char: remember it and wait for the second */
			filter->cache = c;
			filter->status = 1;
		} else if (c == 0x8e) {
			/* kana first char */
			filter->status = 2;
		} else if (c == 0x8f) {
			/* X 0212 first char */
			filter->status = 3;
		} else {
			/* anything else is emitted tagged with the THROUGH group */
			wc = (c & MBFL_WCSGROUP_MASK) | MBFL_WCSGROUP_THROUGH;
			CK((*filter->output_function)(wc, filter->data));
		}
		break;

	case 1:
		/* second byte of a two-byte character */
		lead = filter->cache;
		filter->status = 0;
		if (in_gr) {
			/* linear index: 94 cells per row, both bytes based at 0xa1 */
			idx = (lead - 0xa1)*94 + c - 0xa1;

			/* cells that get a fixed code point instead of a table lookup */
			switch (idx) {
			case 31:
				wc = 0xff3c;	/* FULLWIDTH REVERSE SOLIDUS */
				break;
			case 32:
				wc = 0xff5e;	/* FULLWIDTH TILDE */
				break;
			case 33:
				wc = 0x2225;	/* PARALLEL TO */
				break;
			case 60:
				wc = 0xff0d;	/* FULLWIDTH HYPHEN-MINUS */
				break;
			case 80:
				wc = 0xffe0;	/* FULLWIDTH CENT SIGN */
				break;
			case 81:
				wc = 0xffe1;	/* FULLWIDTH POUND SIGN */
				break;
			case 137:
				wc = 0xffe2;	/* FULLWIDTH NOT SIGN */
				break;
			default:
				wc = 0;
				break;
			}

			if (wc == 0) {
				if (idx >= cp932ext1_ucs_table_min && idx < cp932ext1_ucs_table_max) {
					/* vendor ext1 (13ku) */
					wc = cp932ext1_ucs_table[idx - cp932ext1_ucs_table_min];
				} else if (idx >= 0 && idx < jisx0208_ucs_table_size) {
					/* X 0208 */
					wc = jisx0208_ucs_table[idx];
				} else if (idx >= (84 * 94)) {
					/* user (85ku - 94ku) */
					wc = idx - (84 * 94) + 0xe000;
				}
			}

			if (wc <= 0) {
				/* no mapping: emit the 7-bit byte pair tagged with the WINCP932 plane */
				wc = ((((lead & 0x7f) << 8) | (c & 0x7f)) & MBFL_WCSPLANE_MASK) | MBFL_WCSPLANE_WINCP932;
			}
			CK((*filter->output_function)(wc, filter->data));
		} else if (is_ctl) {
			/* CTLs are forwarded as they are; the cached byte is dropped */
			CK((*filter->output_function)(c, filter->data));
		} else {
			wc = (((lead << 8) | c) & MBFL_WCSGROUP_MASK) | MBFL_WCSGROUP_THROUGH;
			CK((*filter->output_function)(wc, filter->data));
		}
		break;

	case 2:
		/* byte following 0x8e: X0201 kana */
		filter->status = 0;
		if (c > 0xa0 && c < 0xe0) {
			wc = 0xfec0 + c;
			CK((*filter->output_function)(wc, filter->data));
		} else if (is_ctl) {
			CK((*filter->output_function)(c, filter->data));
		} else {
			wc = ((0x8e00 | c) & MBFL_WCSGROUP_MASK) | MBFL_WCSGROUP_THROUGH;
			CK((*filter->output_function)(wc, filter->data));
		}
		break;

	case 3:
		/* byte following 0x8f: X 0212 first char */
		if (is_ctl) {
			CK((*filter->output_function)(c, filter->data));
			filter->status = 0;
		} else {
			/* range validation of this byte is deferred to state 4 */
			filter->cache = c;
			filter->status = 4;
		}
		break;

	case 4:
		/* second byte following 0x8f: X 0212 second char */
		lead = filter->cache;
		filter->status = 0;
		if (lead > 0xa0 && lead < 0xff && in_gr) {
			idx = (lead - 0xa1)*94 + c - 0xa1;
			wc = 0;
			if (idx >= 0 && idx < jisx0212_ucs_table_size) {
				wc = jisx0212_ucs_table[idx];
				if (wc == 0x007e) {
					wc = 0xff5e;	/* FULLWIDTH TILDE */
				}
			} else if (idx >= (82*94) && idx < (84*94)) {
				/* vendor ext3 (83ku - 84ku) <-> CP932 (115ku - 120ku) */
				idx = (lead << 8) | c;	/* the table is keyed by the raw byte pair */
				for (i = 0; i < cp932ext3_eucjp_table_size; i++) {
					if (idx == cp932ext3_eucjp_table[i]) {
						if (i < (cp932ext3_ucs_table_max - cp932ext3_ucs_table_min)) {
							wc = cp932ext3_ucs_table[i];
						}
						break;
					}
				}
			} else if (idx >= (84*94)) {
				/* user (85ku - 94ku) */
				wc = idx - (84*94) + (0xe000 + (94*10));
			}

			if (wc == 0x00A6) {
				wc = 0xFFE4;	/* FULLWIDTH BROKEN BAR */
			}
			if (wc <= 0) {
				/* no mapping: emit the 7-bit byte pair tagged with the JIS0212 plane */
				wc = ((((lead & 0x7f) << 8) | (c & 0x7f)) & MBFL_WCSPLANE_MASK) | MBFL_WCSPLANE_JIS0212;
			}
			CK((*filter->output_function)(wc, filter->data));
		} else if (is_ctl) {
			CK((*filter->output_function)(c, filter->data));
		} else {
			wc = (((lead << 8) | c | 0x8f0000) & MBFL_WCSGROUP_MASK) | MBFL_WCSGROUP_THROUGH;
			CK((*filter->output_function)(wc, filter->data));
		}
		break;

	default:
		/* unknown state: resynchronise */
		filter->status = 0;
		break;
	}

	return c;
}
int mbfl_filt_conv_wchar_eucjpwin ( int  c,
mbfl_convert_filter *  filter 
)

Definition at line 259 of file mbfilter_euc_jp_win.c.

{
	/*
	 * Convert one wide character to its eucJP-win byte sequence.
	 *
	 *   c       wide character to encode
	 *   filter  conversion filter; bytes are handed to
	 *           filter->output_function one at a time
	 *
	 * s1 carries the intermediate code and its range selects the output form:
	 *   s1 <  0       no mapping; mbfl_filt_conv_illegal_output() is called
	 *                 unless illegal_mode is MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE
	 *   s1 <  0x80    one byte
	 *   s1 <  0x100   0x8e followed by s1                    (kana)
	 *   s1 <  0x8080  two bytes, each with bit 0x80 set      (X 0208)
	 *   otherwise     0x8f followed by two such bytes        (X 0212)
	 *
	 * Returns c, or -1 (through CK) as soon as an output call reports a
	 * negative value.
	 */
	int c1, c2, s1;

	/* first try: direct lookup in the range-partitioned UCS -> JIS tables */
	s1 = 0;
	if (c >= ucs_a1_jis_table_min && c < ucs_a1_jis_table_max) {
		s1 = ucs_a1_jis_table[c - ucs_a1_jis_table_min];
	} else if (c >= ucs_a2_jis_table_min && c < ucs_a2_jis_table_max) {
		s1 = ucs_a2_jis_table[c - ucs_a2_jis_table_min];
	} else if (c >= ucs_i_jis_table_min && c < ucs_i_jis_table_max) {
		s1 = ucs_i_jis_table[c - ucs_i_jis_table_min];
	} else if (c >= ucs_r_jis_table_min && c < ucs_r_jis_table_max) {
		s1 = ucs_r_jis_table[c - ucs_r_jis_table_min];
	} else if (c >= 0xe000 && c < (0xe000 + 10*94)) {	/* user  (X0208  85ku - 94ku) */
		s1 = c - 0xe000;
		c1 = s1/94 + 0x75;
		c2 = s1%94 + 0x21;
		s1 = (c1 << 8) | c2;
	} else if (c >= (0xe000 + 10*94) && c < (0xe000 + 20*94)) {	/* user  (X0212  85ku - 94ku) */
		s1 = c - (0xe000 + 10*94);
		c1 = s1/94 + 0xf5;
		c2 = s1%94 + 0xa1;
		s1 = (c1 << 8) | c2;
	}
	if (s1 == 0xa2f1) {
		s1 = 0x2d62;		/* NUMERO SIGN */
	}

	/* second try: plane-tagged values, fixed special cases, vendor extensions */
	if (s1 <= 0) {
		c1 = c & ~MBFL_WCSPLANE_MASK;
		if (c1 == MBFL_WCSPLANE_WINCP932) {
			s1 = c & MBFL_WCSPLANE_MASK;
			if (s1 >= ((85 + 0x20) << 8)) {	/* 85ku - 120ku */
				s1 = -1;
			}
		} else if (c1 == MBFL_WCSPLANE_JIS0208) {
			s1 = c & MBFL_WCSPLANE_MASK;
			if (s1 >= ((85 + 0x20) << 8)) {	/* 85ku - 94ku */
				s1 = -1;
			}
		} else if (c1 == MBFL_WCSPLANE_JIS0212) {
			s1 = c & MBFL_WCSPLANE_MASK;
			if (s1 >= ((83 + 0x20) << 8)) {	/* 83ku - 94ku */
				s1 = -1;
			} else {
				/* setting both high bits pushes s1 into the X 0212 output range */
				s1 |= 0x8080;
			}
		} else if (c == 0xa5) {		/* YEN SIGN */
			s1 = 0x216f;			/* FULLWIDTH YEN SIGN */
		} else if (c == 0x203e) {	/* OVER LINE */
			s1 = 0x2131;			/* FULLWIDTH MACRON */
		} else if (c == 0xff3c) {	/* FULLWIDTH REVERSE SOLIDUS */
			s1 = 0x2140;
		} else if (c == 0xff5e) {	/* FULLWIDTH TILDE */
			s1 = 0x2141;
		} else if (c == 0x2225) {	/* PARALLEL TO */
			s1 = 0x2142;
		} else if (c == 0xff0d) {	/* FULLWIDTH HYPHEN-MINUS */
			s1 = 0x215d;
		} else if (c == 0xffe0) {	/* FULLWIDTH CENT SIGN */
			s1 = 0x2171;
		} else if (c == 0xffe1) {	/* FULLWIDTH POUND SIGN */
			s1 = 0x2172;
		} else if (c == 0xffe2) {	/* FULLWIDTH NOT SIGN */
			s1 = 0x224c;
		} else {
			/* row offset of the ext1 table; does not change while searching */
			const int oh = cp932ext1_ucs_table_min / 94;

			s1 = -1;
			c1 = 0;
			c2 = cp932ext1_ucs_table_max - cp932ext1_ucs_table_min;
			while (c1 < c2) {		/* CP932 vendor ext1 (13ku) */
				if (c == cp932ext1_ucs_table[c1]) {
					s1 = ((c1 / 94 + oh + 0x21) << 8) + (c1 % 94 + 0x21);
					break;
				}
				c1++;
			}
			if (s1 < 0) {
				c1 = 0;
				c2 = cp932ext3_ucs_table_max - cp932ext3_ucs_table_min;
				while (c1 < c2) {		/* CP932 vendor ext3 (115ku - 119ku) */
					if (c == cp932ext3_ucs_table[c1]) {
						if (c1 < cp932ext3_eucjp_table_size) {
							s1 = cp932ext3_eucjp_table[c1];
						}
						break;
					}
					c1++;
				}
			}
		}
		/* only c == 0 may legitimately encode as 0; any other 0 means "unmapped" */
		if (c == 0) {
			s1 = 0;
		} else if (s1 <= 0) {
			s1 = -1;
		}
	}

	if (s1 >= 0) {
		if (s1 < 0x80) {	/* latin */
			CK((*filter->output_function)(s1, filter->data));
		} else if (s1 < 0x100) {	/* kana */
			CK((*filter->output_function)(0x8e, filter->data));
			CK((*filter->output_function)(s1, filter->data));
		} else if (s1 < 0x8080)  {	/* X 0208 */
			CK((*filter->output_function)(((s1 >> 8) & 0xff) | 0x80, filter->data));
			CK((*filter->output_function)((s1 & 0xff) | 0x80, filter->data));
		} else {	/* X 0212 */
			CK((*filter->output_function)(0x8f, filter->data));
			CK((*filter->output_function)(((s1 >> 8) & 0xff) | 0x80, filter->data));
			CK((*filter->output_function)((s1 & 0xff) | 0x80, filter->data));
		}
	} else {
		if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
			CK(mbfl_filt_conv_illegal_output(c, filter));
		}
	}

	return c;
}

Here is the call graph for this function:

static int mbfl_filt_ident_eucjp_win ( int  c,
mbfl_identify_filter *  filter 
) [static]

Definition at line 382 of file mbfilter_euc_jp_win.c.

{
	/*
	 * Feed one byte to the eucJP-win identification state machine.
	 *
	 *   c       next input byte
	 *   filter  identify state; filter->status is the current state and
	 *           filter->flag is set to 1 when a byte does not fit
	 *
	 * States: 0 = between characters, 1 = first half of a two-byte
	 * character seen, 2 = 0x8e seen, 3 = 0x8f seen, 4 = 0x8f plus one byte.
	 * Always returns c.
	 */
	const int in_gr = (c >= 0xa1 && c <= 0xfe);

	switch (filter->status) {
	case 0:
		if (c == 0x8e) {
			/* kana first char */
			filter->status = 2;
		} else if (c == 0x8f) {
			/* X 0212 first char */
			filter->status = 3;
		} else if (in_gr) {
			/* kanji first char */
			filter->status = 1;
		} else if (c < 0 || c >= 0x80) {
			/* neither latin nor a valid lead byte: bad */
			filter->flag = 1;
		}
		break;

	case 1:		/* got first half */
	case 4:		/* got 0x8f and one more byte */
		if (!in_gr) {
			filter->flag = 1;
		}
		filter->status = 0;
		break;

	case 2:		/* got 0x8e */
		if (!(c >= 0xa1 && c <= 0xdf)) {
			filter->flag = 1;
		}
		filter->status = 0;
		break;

	case 3:		/* got 0x8f */
		if (!in_gr) {
			filter->flag = 1;
		}
		/* one more byte is consumed even when this one was bad */
		filter->status = 4;
		break;

	default:
		filter->status = 0;
		break;
	}

	return c;
}

Variable Documentation

const mbfl_encoding mbfl_encoding_eucjp_win
Initial value: (initializer not captured in this extract)

Definition at line 73 of file mbfilter_euc_jp_win.c.

const char* mbfl_encoding_eucjp_win_aliases[] [static]
Initial value:
 {"eucJP-open",  /* alias names (per the variable name); the list is terminated by a NULL entry */
                                                 "eucJP-ms", NULL}

Definition at line 63 of file mbfilter_euc_jp_win.c.

const unsigned char mblen_table_eucjp[] [static]
Initial value:
 { /* 256 entries, one per byte value 0x00-0xff; presumably the length in bytes of the
      sequence that starts with that byte - verify against the users of this table */
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, /* 0x00 - 0x0f */
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, /* 0x10 - 0x1f */
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, /* 0x20 - 0x2f */
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, /* 0x30 - 0x3f */
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, /* 0x40 - 0x4f */
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, /* 0x50 - 0x5f */
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, /* 0x60 - 0x6f */
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, /* 0x70 - 0x7f */
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 3, /* 0x80 - 0x8f: 0x8e is 2, 0x8f is 3 */
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, /* 0x90 - 0x9f */
  1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, /* 0xa0 - 0xaf: 0xa0 is 1 */
  2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, /* 0xb0 - 0xbf */
  2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, /* 0xc0 - 0xcf */
  2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, /* 0xd0 - 0xdf */
  2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, /* 0xe0 - 0xef */
  2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1  /* 0xf0 - 0xff: 0xff is 1 */
}

Definition at line 43 of file mbfilter_euc_jp_win.c.