File: iconv_hook_mssjis.c

package info (click to toggle)
libapache-mod-encoding 0.0.20021209-12
  • links: PTS
  • area: main
  • in suites: bookworm, forky, sid, trixie
  • size: 1,700 kB
  • sloc: ansic: 94,406; sh: 6,693; makefile: 43
file content (129 lines) | stat: -rw-r--r-- 3,168 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
/* -*- mode: c -*-
 *
 * $Id: iconv_hook_mssjis.c,v 1.3 2002/06/10 13:24:49 tai Exp $
 * Framework Author: Taisuke Yamada (tai@iij.ad.jp)
 * Logic Composer:   Kunio Miyamoto (wakatono@todo.gr.jp)
 */

#include <sys/types.h>
#include <string.h>
#include <dirent.h>
#include <unistd.h>

#include "iconv_hook.h"
#include "cp.h"

#define	MSSJISENC	"MSSJIS"
#define is_zen(c) \
        ((0x81 <= ((unsigned char) (c)) && ((unsigned char) (c)) <= 0x9f) \
        || (0xe0 <= ((unsigned char) (c)) && ((unsigned char) (c)) <= 0xfc))
#define is_han(c) \
        ((0xa0 <= ((unsigned char) (c)) && ((unsigned char) (c)) <= 0xdf))

static size_t skip_bytes(char c)
{
  if(is_zen(c)) {
    return 2;
  } else if (is_han(c)) {
    return 1;
  }
  return 0;
}

/*
 * mssjis_iconv_open()
 * by Kunio Miyamoto (wakatono@todo.gr.jp)
 * This code is for iconv() interface compatibility.
 * and processes nothing but returns normal return code(fixes to 1).
 */
 
static iconv_t
mssjis_iconv_open(const char *oenc, const char *ienc) {
  if( (strncmp(ienc,MSSJISENC,6) == 0) && (strncmp(oenc,"UTF-8",5) == 0) )
  {
  	return (iconv_t)1;
  }
  else
  {
  	return (iconv_t)-1;
  }
}

/*
 * mssjis_iconv_close() 
 * by Kunio Miyamoto (wakatono@todo.gr.jp)
 * This code is for iconv() interface compatibility.
 * and processes nothing but returns normal return code(fixes to 1).
 */
 
static int
mssjis_iconv_close(iconv_t cd) {
  return 0;
}

/* mssjis_iconv()
 * by Kunio Miyamoto (wakatono@todo.gr.jp)
 *  Microsoft ShiftJIS code to UTF-8 
 * This is experimental code for processing Microsoft Shift JIS Code :-(
 * This routine uses fixed table cp[] in "cp.h" , and does'nt be needed to
 * load conversion table.
 */
 
size_t
mssjis_iconv(iconv_t cd,
	    char **srcbuf, size_t *srclen, char **outbuf, size_t *outlen) {
  unsigned char *dst;
  unsigned char *src;
  unsigned short utf8code;
  int sjiscode;
  size_t len;
  unsigned char *to2;

  if (! (srcbuf && srclen && outbuf && outlen))
    return 0;

  src = (unsigned char *)*srcbuf;
  dst = to2 = malloc(*outlen);
  while (*src && ((dst - to2) < (*outlen - 4))) {
    len = skip_bytes(*src);
    if ( len == 2 ) {
      sjiscode = (int)(*src++ & 0xff);
      sjiscode = (int)((sjiscode << 8)|(*src++ & 0xff));
    } else {
      sjiscode = (int)(*src++ & 0xff);
    }
    utf8code = cp[sjiscode]; /* convert sjis code to utf8 (cp[] is conversion table array) */

    if ( utf8code <= 0x7f ) {
      *dst++ = (char)(utf8code & 0xff);
    } else if ( utf8code <= 0x7ff ){
      *dst++ = (char)( 0xc0 | ((utf8code >> 6) & 0xff));
      *dst++ = (char)( 0x80 | ( utf8code & 0x3f ));
    } else {
      *dst++ = (char)( 0xe0 | ((utf8code >> 12) & 0x0f));
      *dst++ = (char)( 0x80 | ((utf8code >> 6)  & 0x3f));
      *dst++ = (char)( 0x80 | (utf8code & 0x3f));
    }

  }
  *dst++='\0';
  memcpy(*outbuf,to2,*outlen);
  free(to2);
  *srcbuf += *src;
  *srclen = 0;
  *outbuf = dst;
  *outlen = strlen(*outbuf);
  return strlen(*outbuf);
}

static iconv_hook_module iconv_hook_mssjis = {
  mssjis_iconv,
  mssjis_iconv_open,
  mssjis_iconv_close,
};

iconv_hook_module *
iconv_hook_mssjis_init(void) {
  return &iconv_hook_mssjis;
}