#include <stdio.h>
#include <errno.h>
#include <stdlib.h>
#include <sys/types.h>
#define __NEED_UNI_2_TCVN__
#include <unicode_tcvn.h>
#include "common_defs.h"
#define NON_ID_CHAR '?'
/*
 * Conversion state handed back by _icv_open() as an opaque pointer and
 * passed to _icv_iconv() / _icv_close().
 */
typedef struct _icv_state {
/*
 * Cleared to 0 by _icv_open() and at the start of each _icv_iconv() call;
 * set to the errno value when _icv_iconv() reports a conversion error.
 */
int _errno;
} _iconv_st;
/*
 * _icv_open - allocate the state block for one conversion descriptor.
 *
 * Returns a pointer to a freshly allocated _iconv_st whose _errno field is 0.
 * If the allocation fails, errno is set to ENOMEM and (void *)-1 is returned.
 * The returned block is released by _icv_close().
 */
void *
_icv_open()
{
	_iconv_st *state = malloc(sizeof (*state));

	if (state == NULL) {
		errno = ENOMEM;
		return ((void *)-1);
	}

	state->_errno = 0;
	return (state);
}
/*
 * _icv_close - release a state block obtained from _icv_open().
 *
 * A NULL st is rejected by setting errno to EBADF; otherwise the block is
 * freed.  Nothing is returned in either case.
 */
void
_icv_close(_iconv_st *st)
{
	if (st == NULL) {
		errno = EBADF;
		return;
	}

	free(st);
}
/*
 * _icv_iconv - convert UTF-8 input to single-byte TCVN5712 output.
 *
 * Each UTF-8 sequence (1 to 4 bytes) is decoded to a code point and mapped
 * through uni_2_tcvn().  A code point for which uni_2_tcvn() does not
 * return 1 is written as NON_ID_CHAR and counted.
 *
 * Parameters:
 *   st            conversion state from _icv_open(); must not be NULL.
 *   inbuf         in/out cursor into the input; advanced past every
 *                 sequence that was converted.  If inbuf or *inbuf is NULL,
 *                 only st->_errno is cleared and 0 is returned.
 *   inbytesleft   in/out count of unread input bytes.
 *   outbuf        in/out cursor into the output buffer.
 *   outbytesleft  in/out count of free output bytes.
 *
 * Returns the number of characters replaced by NON_ID_CHAR, or (size_t)-1
 * with errno set (and mirrored into st->_errno when st is non-NULL) to:
 *   EBADF   st is NULL.
 *   EILSEQ  invalid lead byte or invalid continuation byte.
 *   EINVAL  the input ends in the middle of a multi-byte sequence.
 *   E2BIG   the output buffer is full while input remains.
 * On error the cursors and counts describe everything converted before the
 * offending sequence, so the caller can resume or report the position.
 *
 * NOTE(review): overlong encodings, surrogate code points and values above
 * U+10FFFF are not rejected here; the decoded value is passed to
 * uni_2_tcvn() as is.
 */
size_t
_icv_iconv(_iconv_st *st, char **inbuf, size_t *inbytesleft,
    char **outbuf, size_t *outbytesleft)
{
	size_t		no_id_char_num = 0;
	unsigned char	*ip;
	int		err;

#ifdef DEBUG
	fprintf(stderr, "========== iconv(): UTF-8 --> TCVN5712 ==========\n");
#endif

	if (st == NULL) {
		errno = EBADF;
		return ((size_t)-1);
	}

	/* No input buffer: nothing to convert, just clear the recorded error. */
	if (inbuf == NULL || *inbuf == NULL) {
		st->_errno = 0;
		return ((size_t)0);
	}

	st->_errno = 0;
	errno = 0;

	/* Only read *inbuf after the NULL checks above. */
	ip = (unsigned char *)*inbuf;

	while (*inbytesleft > 0) {
		unsigned long	uni;
		unsigned char	ch = 0;
		size_t		utf8_len;
		size_t		avail;
		size_t		i;

		/* Input remains but there is nowhere to put its conversion. */
		if (*outbytesleft == 0) {
			err = E2BIG;
			goto fail;
		}

		/*
		 * The lead byte alone fixes the sequence length and supplies
		 * the high-order payload bits.
		 */
		if ((*ip & 0x80) == 0x00) {
			utf8_len = 1;
			uni = *ip;
		} else if ((*ip & 0xe0) == 0xc0) {
			utf8_len = 2;
			uni = *ip & 0x1f;
		} else if ((*ip & 0xf0) == 0xe0) {
			utf8_len = 3;
			uni = *ip & 0x0f;
		} else if ((*ip & 0xf8) == 0xf0) {
			utf8_len = 4;
			uni = *ip & 0x07;
		} else {
			/* Stray continuation byte or a lead byte >= 0xf8. */
			err = EILSEQ;
			goto fail;
		}

		/*
		 * Check every continuation byte that is actually present
		 * before deciding the sequence is merely truncated: a bad
		 * byte is EILSEQ no matter how much more input might follow.
		 */
		avail = (*inbytesleft < utf8_len) ? *inbytesleft : utf8_len;
		for (i = 1; i < avail; i++) {
			if ((ip[i] & 0xc0) != 0x80) {
				err = EILSEQ;
				goto fail;
			}
			uni = (uni << 6) | (unsigned long)(ip[i] & 0x3f);
		}
		if (avail < utf8_len) {
			err = EINVAL;
			goto fail;
		}

		if (uni_2_tcvn(uni, &ch) == 1) {
			**outbuf = ch;
		} else {
			**outbuf = NON_ID_CHAR;
			no_id_char_num++;
		}

		(*outbuf)++;
		(*outbytesleft)--;
		ip += utf8_len;
		(*inbytesleft) -= utf8_len;
	}

	/* Publish how far the input was consumed. */
	*inbuf = (char *)ip;
	return (no_id_char_num);

fail:
	*inbuf = (char *)ip;
	st->_errno = errno = err;
	return ((size_t)-1);
}