Header And Logo

PostgreSQL
| The world's most advanced open source database.

Defines | Functions | Variables

euc_tw_and_big5.c File Reference

#include "postgres.h"
#include "fmgr.h"
#include "mb/pg_wchar.h"
Include dependency graph for euc_tw_and_big5.c:

Go to the source code of this file.

Defines

#define ENCODING_GROWTH_RATE   4

Functions

 PG_FUNCTION_INFO_V1 (euc_tw_to_big5)
 PG_FUNCTION_INFO_V1 (big5_to_euc_tw)
 PG_FUNCTION_INFO_V1 (euc_tw_to_mic)
 PG_FUNCTION_INFO_V1 (mic_to_euc_tw)
 PG_FUNCTION_INFO_V1 (big5_to_mic)
 PG_FUNCTION_INFO_V1 (mic_to_big5)
Datum euc_tw_to_big5 (PG_FUNCTION_ARGS)
Datum big5_to_euc_tw (PG_FUNCTION_ARGS)
Datum euc_tw_to_mic (PG_FUNCTION_ARGS)
Datum mic_to_euc_tw (PG_FUNCTION_ARGS)
Datum big5_to_mic (PG_FUNCTION_ARGS)
Datum mic_to_big5 (PG_FUNCTION_ARGS)
static void big52mic (const unsigned char *big5, unsigned char *p, int len)
static void mic2big5 (const unsigned char *mic, unsigned char *p, int len)
static void euc_tw2mic (const unsigned char *euc, unsigned char *p, int len)
static void mic2euc_tw (const unsigned char *mic, unsigned char *p, int len)

Variables

 PG_MODULE_MAGIC

Define Documentation

#define ENCODING_GROWTH_RATE   4

Definition at line 18 of file euc_tw_and_big5.c.

Referenced by big5_to_euc_tw(), and euc_tw_to_big5().


Function Documentation

static void big52mic ( const unsigned char *  big5,
unsigned char *  p,
int  len 
) [static]

Definition at line 260 of file euc_tw_and_big5.c.

References BIG5toCNS(), IS_HIGHBIT_SET, LC_CNS11643_3, LC_CNS11643_4, PG_BIG5, pg_encoding_verifymb(), PG_MULE_INTERNAL, report_invalid_encoding(), and report_untranslatable_char().

Referenced by big5_to_euc_tw(), and big5_to_mic().

{
    unsigned short c1;
    unsigned short big5buf,
                cnsBuf;
    unsigned char lc;
    int         l;

    while (len > 0)
    {
        c1 = *big5;
        if (!IS_HIGHBIT_SET(c1))
        {
            /* ASCII */
            if (c1 == 0)
                report_invalid_encoding(PG_BIG5,
                                        (const char *) big5, len);
            *p++ = c1;
            big5++;
            len--;
            continue;
        }
        l = pg_encoding_verifymb(PG_BIG5, (const char *) big5, len);
        if (l < 0)
            report_invalid_encoding(PG_BIG5,
                                    (const char *) big5, len);
        big5buf = (c1 << 8) | big5[1];
        cnsBuf = BIG5toCNS(big5buf, &lc);
        if (lc != 0)
        {
            /* Planes 3 and 4 are MULE private charsets */
            if (lc == LC_CNS11643_3 || lc == LC_CNS11643_4)
                *p++ = LCPRV2_B;
            *p++ = lc;          /* Plane No. */
            *p++ = (cnsBuf >> 8) & 0x00ff;
            *p++ = cnsBuf & 0x00ff;
        }
        else
            report_untranslatable_char(PG_BIG5, PG_MULE_INTERNAL,
                                       (const char *) big5, len);
        big5 += l;
        len -= l;
    }
    *p = '\0';
}

Datum big5_to_euc_tw ( PG_FUNCTION_ARGS   ) 

Definition at line 71 of file euc_tw_and_big5.c.

References big52mic(), buf, CHECK_ENCODING_CONVERSION_ARGS, ENCODING_GROWTH_RATE, mic2euc_tw(), palloc(), pfree(), PG_BIG5, PG_EUC_TW, PG_GETARG_CSTRING, PG_GETARG_INT32, and PG_RETURN_VOID.

{
    unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);
    unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);
    int         len = PG_GETARG_INT32(4);
    unsigned char *buf;

    CHECK_ENCODING_CONVERSION_ARGS(PG_BIG5, PG_EUC_TW);

    buf = palloc(len * ENCODING_GROWTH_RATE + 1);
    big52mic(src, buf, len);
    mic2euc_tw(buf, dest, strlen((char *) buf));
    pfree(buf);

    PG_RETURN_VOID();
}

Datum big5_to_mic ( PG_FUNCTION_ARGS   ) 

Definition at line 117 of file euc_tw_and_big5.c.

References big52mic(), CHECK_ENCODING_CONVERSION_ARGS, PG_BIG5, PG_GETARG_CSTRING, PG_GETARG_INT32, PG_MULE_INTERNAL, and PG_RETURN_VOID.

{
    unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);
    unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);
    int         len = PG_GETARG_INT32(4);

    CHECK_ENCODING_CONVERSION_ARGS(PG_BIG5, PG_MULE_INTERNAL);

    big52mic(src, dest, len);

    PG_RETURN_VOID();
}

static void euc_tw2mic ( const unsigned char *  euc,
unsigned char *  p,
int  len 
) [static]

Definition at line 148 of file euc_tw_and_big5.c.

References IS_HIGHBIT_SET, pg_encoding_verifymb(), PG_EUC_TW, report_invalid_encoding(), and SS2.

Referenced by euc_tw_to_big5(), and euc_tw_to_mic().

{
    int         c1;
    int         l;

    while (len > 0)
    {
        c1 = *euc;
        if (IS_HIGHBIT_SET(c1))
        {
            l = pg_encoding_verifymb(PG_EUC_TW, (const char *) euc, len);
            if (l < 0)
                report_invalid_encoding(PG_EUC_TW,
                                        (const char *) euc, len);
            if (c1 == SS2)
            {
                c1 = euc[1];    /* plane No. */
                if (c1 == 0xa1)
                    *p++ = LC_CNS11643_1;
                else if (c1 == 0xa2)
                    *p++ = LC_CNS11643_2;
                else
                {
                    /* other planes are MULE private charsets */
                    *p++ = LCPRV2_B;
                    *p++ = c1 - 0xa3 + LC_CNS11643_3;
                }
                *p++ = euc[2];
                *p++ = euc[3];
            }
            else
            {                   /* CNS11643-1 */
                *p++ = LC_CNS11643_1;
                *p++ = c1;
                *p++ = euc[1];
            }
            euc += l;
            len -= l;
        }
        else
        {                       /* should be ASCII */
            if (c1 == 0)
                report_invalid_encoding(PG_EUC_TW,
                                        (const char *) euc, len);
            *p++ = c1;
            euc++;
            len--;
        }
    }
    *p = '\0';
}

Datum euc_tw_to_big5 ( PG_FUNCTION_ARGS   ) 

Definition at line 53 of file euc_tw_and_big5.c.

References buf, CHECK_ENCODING_CONVERSION_ARGS, ENCODING_GROWTH_RATE, euc_tw2mic(), mic2big5(), palloc(), pfree(), PG_BIG5, PG_EUC_TW, PG_GETARG_CSTRING, PG_GETARG_INT32, and PG_RETURN_VOID.

{
    unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);
    unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);
    int         len = PG_GETARG_INT32(4);
    unsigned char *buf;

    CHECK_ENCODING_CONVERSION_ARGS(PG_EUC_TW, PG_BIG5);

    buf = palloc(len * ENCODING_GROWTH_RATE + 1);
    euc_tw2mic(src, buf, len);
    mic2big5(buf, dest, strlen((char *) buf));
    pfree(buf);

    PG_RETURN_VOID();
}

Datum euc_tw_to_mic ( PG_FUNCTION_ARGS   ) 

Definition at line 89 of file euc_tw_and_big5.c.

References CHECK_ENCODING_CONVERSION_ARGS, euc_tw2mic(), PG_EUC_TW, PG_GETARG_CSTRING, PG_GETARG_INT32, PG_MULE_INTERNAL, and PG_RETURN_VOID.

{
    unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);
    unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);
    int         len = PG_GETARG_INT32(4);

    CHECK_ENCODING_CONVERSION_ARGS(PG_EUC_TW, PG_MULE_INTERNAL);

    euc_tw2mic(src, dest, len);

    PG_RETURN_VOID();
}

static void mic2big5 ( const unsigned char *  mic,
unsigned char *  p,
int  len 
) [static]

Definition at line 310 of file euc_tw_and_big5.c.

References CNStoBIG5(), IS_HIGHBIT_SET, LC_CNS11643_1, LC_CNS11643_2, LCPRV2_B, PG_BIG5, pg_encoding_verifymb(), PG_MULE_INTERNAL, report_invalid_encoding(), and report_untranslatable_char().

Referenced by euc_tw_to_big5(), and mic_to_big5().

{
    unsigned short c1;
    unsigned short big5buf,
                cnsBuf;
    int         l;

    while (len > 0)
    {
        c1 = *mic;
        if (!IS_HIGHBIT_SET(c1))
        {
            /* ASCII */
            if (c1 == 0)
                report_invalid_encoding(PG_MULE_INTERNAL,
                                        (const char *) mic, len);
            *p++ = c1;
            mic++;
            len--;
            continue;
        }
        l = pg_encoding_verifymb(PG_MULE_INTERNAL, (const char *) mic, len);
        if (l < 0)
            report_invalid_encoding(PG_MULE_INTERNAL,
                                    (const char *) mic, len);
        if (c1 == LC_CNS11643_1 || c1 == LC_CNS11643_2 || c1 == LCPRV2_B)
        {
            if (c1 == LCPRV2_B)
            {
                c1 = mic[1];    /* get plane no. */
                cnsBuf = (mic[2] << 8) | mic[3];
            }
            else
            {
                cnsBuf = (mic[1] << 8) | mic[2];
            }
            big5buf = CNStoBIG5(cnsBuf, c1);
            if (big5buf == 0)
                report_untranslatable_char(PG_MULE_INTERNAL, PG_BIG5,
                                           (const char *) mic, len);
            *p++ = (big5buf >> 8) & 0x00ff;
            *p++ = big5buf & 0x00ff;
        }
        else
            report_untranslatable_char(PG_MULE_INTERNAL, PG_BIG5,
                                       (const char *) mic, len);
        mic += l;
        len -= l;
    }
    *p = '\0';
}

static void mic2euc_tw ( const unsigned char *  mic,
unsigned char *  p,
int  len 
) [static]

Definition at line 204 of file euc_tw_and_big5.c.

References IS_HIGHBIT_SET, LC_CNS11643_1, LC_CNS11643_2, LC_CNS11643_3, LC_CNS11643_7, LCPRV2_B, pg_encoding_verifymb(), PG_EUC_TW, PG_MULE_INTERNAL, report_invalid_encoding(), and report_untranslatable_char().

Referenced by big5_to_euc_tw(), and mic_to_euc_tw().

{
    int         c1;
    int         l;

    while (len > 0)
    {
        c1 = *mic;
        if (!IS_HIGHBIT_SET(c1))
        {
            /* ASCII */
            if (c1 == 0)
                report_invalid_encoding(PG_MULE_INTERNAL,
                                        (const char *) mic, len);
            *p++ = c1;
            mic++;
            len--;
            continue;
        }
        l = pg_encoding_verifymb(PG_MULE_INTERNAL, (const char *) mic, len);
        if (l < 0)
            report_invalid_encoding(PG_MULE_INTERNAL,
                                    (const char *) mic, len);
        if (c1 == LC_CNS11643_1)
        {
            *p++ = mic[1];
            *p++ = mic[2];
        }
        else if (c1 == LC_CNS11643_2)
        {
            *p++ = SS2;
            *p++ = 0xa2;
            *p++ = mic[1];
            *p++ = mic[2];
        }
        else if (c1 == LCPRV2_B &&
                 mic[1] >= LC_CNS11643_3 && mic[1] <= LC_CNS11643_7)
        {
            *p++ = SS2;
            *p++ = mic[1] - LC_CNS11643_3 + 0xa3;
            *p++ = mic[2];
            *p++ = mic[3];
        }
        else
            report_untranslatable_char(PG_MULE_INTERNAL, PG_EUC_TW,
                                       (const char *) mic, len);
        mic += l;
        len -= l;
    }
    *p = '\0';
}

Datum mic_to_big5 ( PG_FUNCTION_ARGS   ) 

Definition at line 131 of file euc_tw_and_big5.c.

References CHECK_ENCODING_CONVERSION_ARGS, mic2big5(), PG_BIG5, PG_GETARG_CSTRING, PG_GETARG_INT32, PG_MULE_INTERNAL, and PG_RETURN_VOID.

{
    unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);
    unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);
    int         len = PG_GETARG_INT32(4);

    CHECK_ENCODING_CONVERSION_ARGS(PG_MULE_INTERNAL, PG_BIG5);

    mic2big5(src, dest, len);

    PG_RETURN_VOID();
}

Datum mic_to_euc_tw ( PG_FUNCTION_ARGS   ) 

Definition at line 103 of file euc_tw_and_big5.c.

References CHECK_ENCODING_CONVERSION_ARGS, mic2euc_tw(), PG_EUC_TW, PG_GETARG_CSTRING, PG_GETARG_INT32, PG_MULE_INTERNAL, and PG_RETURN_VOID.

{
    unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);
    unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);
    int         len = PG_GETARG_INT32(4);

    CHECK_ENCODING_CONVERSION_ARGS(PG_MULE_INTERNAL, PG_EUC_TW);

    mic2euc_tw(src, dest, len);

    PG_RETURN_VOID();
}

PG_FUNCTION_INFO_V1 ( euc_tw_to_mic   ) 
PG_FUNCTION_INFO_V1 ( mic_to_euc_tw   ) 
PG_FUNCTION_INFO_V1 ( big5_to_mic   ) 
PG_FUNCTION_INFO_V1 ( mic_to_big5   ) 
PG_FUNCTION_INFO_V1 ( big5_to_euc_tw   ) 
PG_FUNCTION_INFO_V1 ( euc_tw_to_big5   ) 

Variable Documentation

Definition at line 20 of file euc_tw_and_big5.c.