PostgreSQL Source Code git master
All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Pages
euc_cn_and_mic.c
Go to the documentation of this file.
1/*-------------------------------------------------------------------------
2 *
3 * EUC_CN and MULE_INTERNAL
4 *
5 * Portions Copyright (c) 1996-2025, PostgreSQL Global Development Group
6 * Portions Copyright (c) 1994, Regents of the University of California
7 *
8 * IDENTIFICATION
9 * src/backend/utils/mb/conversion_procs/euc_cn_and_mic/euc_cn_and_mic.c
10 *
11 *-------------------------------------------------------------------------
12 */
13
14#include "postgres.h"
15#include "fmgr.h"
16#include "mb/pg_wchar.h"
17
19
22
23/* ----------
24 * conv_proc(
25 * INTEGER, -- source encoding id
26 * INTEGER, -- destination encoding id
27 * CSTRING, -- source string (null terminated C string)
28 * CSTRING, -- destination string (null terminated C string)
29 * INTEGER, -- source string length
30 * BOOL -- if true, don't throw an error if conversion fails
31 * ) returns INTEGER;
32 *
33 * Returns the number of bytes successfully converted.
34 * ----------
35 */
36
37static int euc_cn2mic(const unsigned char *euc, unsigned char *p, int len, bool noError);
38static int mic2euc_cn(const unsigned char *mic, unsigned char *p, int len, bool noError);
39
42{
43 unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);
44 unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);
45 int len = PG_GETARG_INT32(4);
46 bool noError = PG_GETARG_BOOL(5);
47 int converted;
48
50
51 converted = euc_cn2mic(src, dest, len, noError);
52
53 PG_RETURN_INT32(converted);
54}
55
58{
59 unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);
60 unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);
61 int len = PG_GETARG_INT32(4);
62 bool noError = PG_GETARG_BOOL(5);
63 int converted;
64
66
67 converted = mic2euc_cn(src, dest, len, noError);
68
69 PG_RETURN_INT32(converted);
70}
71
72/*
73 * EUC_CN ---> MIC
74 */
75static int
76euc_cn2mic(const unsigned char *euc, unsigned char *p, int len, bool noError)
77{
78 const unsigned char *start = euc;
79 int c1;
80
81 while (len > 0)
82 {
83 c1 = *euc;
84 if (IS_HIGHBIT_SET(c1))
85 {
86 if (len < 2 || !IS_HIGHBIT_SET(euc[1]))
87 {
88 if (noError)
89 break;
90 report_invalid_encoding(PG_EUC_CN, (const char *) euc, len);
91 }
92 *p++ = LC_GB2312_80;
93 *p++ = c1;
94 *p++ = euc[1];
95 euc += 2;
96 len -= 2;
97 }
98 else
99 { /* should be ASCII */
100 if (c1 == 0)
101 {
102 if (noError)
103 break;
104 report_invalid_encoding(PG_EUC_CN, (const char *) euc, len);
105 }
106 *p++ = c1;
107 euc++;
108 len--;
109 }
110 }
111 *p = '\0';
112
113 return euc - start;
114}
115
116/*
117 * MIC ---> EUC_CN
118 */
119static int
120mic2euc_cn(const unsigned char *mic, unsigned char *p, int len, bool noError)
121{
122 const unsigned char *start = mic;
123 int c1;
124
125 while (len > 0)
126 {
127 c1 = *mic;
128 if (IS_HIGHBIT_SET(c1))
129 {
130 if (c1 != LC_GB2312_80)
131 {
132 if (noError)
133 break;
135 (const char *) mic, len);
136 }
137 if (len < 3 || !IS_HIGHBIT_SET(mic[1]) || !IS_HIGHBIT_SET(mic[2]))
138 {
139 if (noError)
140 break;
142 (const char *) mic, len);
143 }
144 mic++;
145 *p++ = *mic++;
146 *p++ = *mic++;
147 len -= 3;
148 }
149 else
150 { /* should be ASCII */
151 if (c1 == 0)
152 {
153 if (noError)
154 break;
156 (const char *) mic, len);
157 }
158 *p++ = c1;
159 mic++;
160 len--;
161 }
162 }
163 *p = '\0';
164
165 return mic - start;
166}
#define IS_HIGHBIT_SET(ch)
Definition: c.h:1126
Datum mic_to_euc_cn(PG_FUNCTION_ARGS)
PG_FUNCTION_INFO_V1(euc_cn_to_mic)
PG_MODULE_MAGIC
static int mic2euc_cn(const unsigned char *mic, unsigned char *p, int len, bool noError)
Datum euc_cn_to_mic(PG_FUNCTION_ARGS)
static int euc_cn2mic(const unsigned char *euc, unsigned char *p, int len, bool noError)
#define PG_GETARG_CSTRING(n)
Definition: fmgr.h:277
#define PG_RETURN_INT32(x)
Definition: fmgr.h:354
#define PG_GETARG_INT32(n)
Definition: fmgr.h:269
#define PG_GETARG_BOOL(n)
Definition: fmgr.h:274
#define PG_FUNCTION_ARGS
Definition: fmgr.h:193
return str start
void report_untranslatable_char(int src_encoding, int dest_encoding, const char *mbstr, int len)
Definition: mbutils.c:1730
void report_invalid_encoding(int encoding, const char *mbstr, int len)
Definition: mbutils.c:1698
const void size_t len
@ PG_MULE_INTERNAL
Definition: pg_wchar.h:233
@ PG_EUC_CN
Definition: pg_wchar.h:228
#define CHECK_ENCODING_CONVERSION_ARGS(srcencoding, destencoding)
Definition: pg_wchar.h:507
#define LC_GB2312_80
Definition: pg_wchar.h:133
uintptr_t Datum
Definition: postgres.h:69