PostgreSQL Source Code git master
Loading...
Searching...
No Matches
encnames.c File Reference
#include "c.h"
#include <ctype.h>
#include <unistd.h>
#include "mb/pg_wchar.h"
Include dependency graph for encnames.c:

Go to the source code of this file.

Data Structures

struct  pg_encname
 

Macros

#define DEF_ENC2NAME(name, codepage)   { #name, PG_##name }
 

Typedefs

typedef struct pg_encname pg_encname
 

Functions

 StaticAssertDecl (lengthof(pg_enc2icu_tbl)==PG_ENCODING_BE_LAST+1, "pg_enc2icu_tbl incomplete")
 
bool is_encoding_supported_by_icu (int encoding)
 
const charget_encoding_name_for_icu (int encoding)
 
int pg_valid_client_encoding (const char *name)
 
int pg_valid_server_encoding (const char *name)
 
int pg_valid_server_encoding_id (int encoding)
 
static charclean_encoding_name (const char *key, char *newkey)
 
int pg_char_to_encoding (const char *name)
 
const charpg_encoding_to_char (int encoding)
 

Variables

static const pg_encname pg_encname_tbl []
 
const pg_enc2name pg_enc2name_tbl []
 
const charpg_enc2gettext_tbl []
 
static const char *const pg_enc2icu_tbl []
 

Macro Definition Documentation

◆ DEF_ENC2NAME

#define DEF_ENC2NAME (   name,
  codepage 
)    { #name, PG_##name }

Definition at line 303 of file encnames.c.

Typedef Documentation

◆ pg_encname

Function Documentation

◆ clean_encoding_name()

static char * clean_encoding_name ( const char key,
char newkey 
)
static

Definition at line 524 of file encnames.c.

525{
526 const char *p;
527 char *np;
528
529 for (p = key, np = newkey; *p != '\0'; p++)
530 {
531 if (isalnum((unsigned char) *p))
532 {
533 if (*p >= 'A' && *p <= 'Z')
534 *np++ = *p + 'a' - 'A';
535 else
536 *np++ = *p;
537 }
538 }
539 *np = '\0';
540 return newkey;
541}
static int fb(int x)

References fb().

Referenced by pg_char_to_encoding().

◆ get_encoding_name_for_icu()

const char * get_encoding_name_for_icu ( int  encoding)

Definition at line 472 of file encnames.c.

473{
475 return NULL;
476 return pg_enc2icu_tbl[encoding];
477}
static const char *const pg_enc2icu_tbl[]
Definition encnames.c:414
static char * encoding
Definition initdb.c:139
#define PG_VALID_BE_ENCODING(_enc)
Definition pg_wchar.h:281

References encoding, fb(), pg_enc2icu_tbl, and PG_VALID_BE_ENCODING.

◆ is_encoding_supported_by_icu()

bool is_encoding_supported_by_icu ( int  encoding)

Definition at line 461 of file encnames.c.

462{
464 return false;
465 return (pg_enc2icu_tbl[encoding] != NULL);
466}

References encoding, fb(), pg_enc2icu_tbl, and PG_VALID_BE_ENCODING.

Referenced by check_icu_locale_encoding(), createdb(), DefineCollation(), and lookup_collation().

◆ pg_char_to_encoding()

int pg_char_to_encoding ( const char name)

Definition at line 549 of file encnames.c.

550{
551 unsigned int nel = lengthof(pg_encname_tbl);
552 const pg_encname *base = pg_encname_tbl,
553 *last = base + nel - 1,
554 *position;
555 int result;
556 char buff[NAMEDATALEN],
557 *key;
558
559 if (name == NULL || *name == '\0')
560 return -1;
561
562 if (strlen(name) >= NAMEDATALEN)
563 return -1; /* it's certainly not in the table */
564
566
567 while (last >= base)
568 {
569 position = base + ((last - base) >> 1);
570 result = key[0] - position->name[0];
571
572 if (result == 0)
573 {
574 result = strcmp(key, position->name);
575 if (result == 0)
576 return position->encoding;
577 }
578 if (result < 0)
579 last = position - 1;
580 else
581 base = position + 1;
582 }
583 return -1;
584}
#define lengthof(array)
Definition c.h:803
static char * clean_encoding_name(const char *key, char *newkey)
Definition encnames.c:524
static const pg_encname pg_encname_tbl[]
Definition encnames.c:39
#define NAMEDATALEN
const char * name

References clean_encoding_name(), fb(), lengthof, name, NAMEDATALEN, and pg_encname_tbl.

◆ pg_encoding_to_char()

const char * pg_encoding_to_char ( int  encoding)

Definition at line 587 of file encnames.c.

588{
590 {
592
593 Assert(encoding == p->encoding);
594 return p->name;
595 }
596 return "";
597}
#define Assert(condition)
Definition c.h:873
const pg_enc2name pg_enc2name_tbl[]
Definition encnames.c:308
#define PG_VALID_ENCODING(_enc)
Definition pg_wchar.h:287
pg_enc encoding
Definition pg_wchar.h:342
const char * name
Definition pg_wchar.h:341

References Assert, encoding, pg_enc2name::encoding, pg_enc2name::name, pg_enc2name_tbl, and PG_VALID_ENCODING.

◆ pg_valid_client_encoding()

int pg_valid_client_encoding ( const char name)

Definition at line 485 of file encnames.c.

486{
487 int enc;
488
489 if ((enc = pg_char_to_encoding(name)) < 0)
490 return -1;
491
493 return -1;
494
495 return enc;
496}
#define PG_VALID_FE_ENCODING(_enc)
Definition pg_wchar.h:291
#define pg_char_to_encoding
Definition pg_wchar.h:629

References enc, name, pg_char_to_encoding, and PG_VALID_FE_ENCODING.

Referenced by check_client_encoding().

◆ pg_valid_server_encoding()

int pg_valid_server_encoding ( const char name)

Definition at line 499 of file encnames.c.

500{
501 int enc;
502
503 if ((enc = pg_char_to_encoding(name)) < 0)
504 return -1;
505
507 return -1;
508
509 return enc;
510}

References enc, name, pg_char_to_encoding, and PG_VALID_BE_ENCODING.

◆ pg_valid_server_encoding_id()

int pg_valid_server_encoding_id ( int  encoding)

Definition at line 513 of file encnames.c.

514{
516}

References encoding, and PG_VALID_BE_ENCODING.

◆ StaticAssertDecl()

StaticAssertDecl ( lengthof(pg_enc2icu_tbl = =PG_ENCODING_BE_LAST+1,
"pg_enc2icu_tbl incomplete"   
)

Variable Documentation

◆ pg_enc2gettext_tbl

const char* pg_enc2gettext_tbl[]

Definition at line 360 of file encnames.c.

361{
362 [PG_SQL_ASCII] = "US-ASCII",
363 [PG_UTF8] = "UTF-8",
365 [PG_LATIN1] = "LATIN1",
366 [PG_LATIN2] = "LATIN2",
367 [PG_LATIN3] = "LATIN3",
368 [PG_LATIN4] = "LATIN4",
369 [PG_ISO_8859_5] = "ISO-8859-5",
370 [PG_ISO_8859_6] = "ISO_8859-6",
371 [PG_ISO_8859_7] = "ISO-8859-7",
372 [PG_ISO_8859_8] = "ISO-8859-8",
373 [PG_LATIN5] = "LATIN5",
374 [PG_LATIN6] = "LATIN6",
375 [PG_LATIN7] = "LATIN7",
376 [PG_LATIN8] = "LATIN8",
377 [PG_LATIN9] = "LATIN-9",
378 [PG_LATIN10] = "LATIN10",
379 [PG_KOI8R] = "KOI8-R",
380 [PG_KOI8U] = "KOI8-U",
381 [PG_WIN1250] = "CP1250",
382 [PG_WIN1251] = "CP1251",
383 [PG_WIN1252] = "CP1252",
384 [PG_WIN1253] = "CP1253",
385 [PG_WIN1254] = "CP1254",
386 [PG_WIN1255] = "CP1255",
387 [PG_WIN1256] = "CP1256",
388 [PG_WIN1257] = "CP1257",
389 [PG_WIN1258] = "CP1258",
390 [PG_WIN866] = "CP866",
391 [PG_WIN874] = "CP874",
392 [PG_EUC_CN] = "EUC-CN",
393 [PG_EUC_JP] = "EUC-JP",
394 [PG_EUC_KR] = "EUC-KR",
395 [PG_EUC_TW] = "EUC-TW",
396 [PG_EUC_JIS_2004] = "EUC-JP",
397 [PG_SJIS] = "SHIFT-JIS",
398 [PG_BIG5] = "BIG5",
399 [PG_GBK] = "GBK",
400 [PG_UHC] = "UHC",
401 [PG_GB18030] = "GB18030",
402 [PG_JOHAB] = "JOHAB",
403 [PG_SHIFT_JIS_2004] = "SHIFT_JISX0213",
404};
#define PG_UTF8
Definition mbprint.c:43
@ PG_WIN1254
Definition pg_wchar.h:257
@ PG_LATIN4
Definition pg_wchar.h:237
@ PG_LATIN9
Definition pg_wchar.h:242
@ PG_JOHAB
Definition pg_wchar.h:269
@ PG_GB18030
Definition pg_wchar.h:268
@ PG_SQL_ASCII
Definition pg_wchar.h:226
@ PG_KOI8R
Definition pg_wchar.h:248
@ PG_ISO_8859_6
Definition pg_wchar.h:252
@ PG_WIN1253
Definition pg_wchar.h:256
@ PG_KOI8U
Definition pg_wchar.h:260
@ PG_LATIN6
Definition pg_wchar.h:239
@ PG_MULE_INTERNAL
Definition pg_wchar.h:233
@ PG_LATIN5
Definition pg_wchar.h:238
@ PG_EUC_CN
Definition pg_wchar.h:228
@ PG_UHC
Definition pg_wchar.h:267
@ PG_LATIN2
Definition pg_wchar.h:235
@ PG_ISO_8859_5
Definition pg_wchar.h:251
@ PG_LATIN10
Definition pg_wchar.h:243
@ PG_WIN1250
Definition pg_wchar.h:255
@ PG_ISO_8859_7
Definition pg_wchar.h:253
@ PG_SJIS
Definition pg_wchar.h:264
@ PG_LATIN8
Definition pg_wchar.h:241
@ PG_EUC_JP
Definition pg_wchar.h:227
@ PG_GBK
Definition pg_wchar.h:266
@ PG_LATIN3
Definition pg_wchar.h:236
@ PG_WIN1256
Definition pg_wchar.h:244
@ PG_LATIN1
Definition pg_wchar.h:234
@ PG_EUC_TW
Definition pg_wchar.h:230
@ PG_WIN1258
Definition pg_wchar.h:245
@ PG_SHIFT_JIS_2004
Definition pg_wchar.h:270
@ PG_WIN1252
Definition pg_wchar.h:250
@ PG_LATIN7
Definition pg_wchar.h:240
@ PG_WIN1255
Definition pg_wchar.h:258
@ PG_WIN1257
Definition pg_wchar.h:259
@ PG_WIN1251
Definition pg_wchar.h:249
@ PG_EUC_KR
Definition pg_wchar.h:229
@ PG_WIN866
Definition pg_wchar.h:246
@ PG_ISO_8859_8
Definition pg_wchar.h:254
@ PG_WIN874
Definition pg_wchar.h:247
@ PG_EUC_JIS_2004
Definition pg_wchar.h:231
@ PG_BIG5
Definition pg_wchar.h:265

◆ pg_enc2icu_tbl

const char* const pg_enc2icu_tbl[]
static

Definition at line 414 of file encnames.c.

415{
416 [PG_SQL_ASCII] = NULL,
417 [PG_EUC_JP] = "EUC-JP",
418 [PG_EUC_CN] = "EUC-CN",
419 [PG_EUC_KR] = "EUC-KR",
420 [PG_EUC_TW] = "EUC-TW",
422 [PG_UTF8] = "UTF-8",
424 [PG_LATIN1] = "ISO-8859-1",
425 [PG_LATIN2] = "ISO-8859-2",
426 [PG_LATIN3] = "ISO-8859-3",
427 [PG_LATIN4] = "ISO-8859-4",
428 [PG_LATIN5] = "ISO-8859-9",
429 [PG_LATIN6] = "ISO-8859-10",
430 [PG_LATIN7] = "ISO-8859-13",
431 [PG_LATIN8] = "ISO-8859-14",
432 [PG_LATIN9] = "ISO-8859-15",
433 [PG_LATIN10] = NULL,
434 [PG_WIN1256] = "CP1256",
435 [PG_WIN1258] = "CP1258",
436 [PG_WIN866] = "CP866",
437 [PG_WIN874] = NULL,
438 [PG_KOI8R] = "KOI8-R",
439 [PG_WIN1251] = "CP1251",
440 [PG_WIN1252] = "CP1252",
441 [PG_ISO_8859_5] = "ISO-8859-5",
442 [PG_ISO_8859_6] = "ISO-8859-6",
443 [PG_ISO_8859_7] = "ISO-8859-7",
444 [PG_ISO_8859_8] = "ISO-8859-8",
445 [PG_WIN1250] = "CP1250",
446 [PG_WIN1253] = "CP1253",
447 [PG_WIN1254] = "CP1254",
448 [PG_WIN1255] = "CP1255",
449 [PG_WIN1257] = "CP1257",
450 [PG_KOI8U] = "KOI8-U",
451};

Referenced by get_encoding_name_for_icu(), and is_encoding_supported_by_icu().

◆ pg_enc2name_tbl

const pg_enc2name pg_enc2name_tbl[]

Definition at line 308 of file encnames.c.

309{
311 [PG_EUC_JP] = DEF_ENC2NAME(EUC_JP, 20932),
312 [PG_EUC_CN] = DEF_ENC2NAME(EUC_CN, 20936),
313 [PG_EUC_KR] = DEF_ENC2NAME(EUC_KR, 51949),
316 [PG_UTF8] = DEF_ENC2NAME(UTF8, 65001),
318 [PG_LATIN1] = DEF_ENC2NAME(LATIN1, 28591),
319 [PG_LATIN2] = DEF_ENC2NAME(LATIN2, 28592),
320 [PG_LATIN3] = DEF_ENC2NAME(LATIN3, 28593),
321 [PG_LATIN4] = DEF_ENC2NAME(LATIN4, 28594),
322 [PG_LATIN5] = DEF_ENC2NAME(LATIN5, 28599),
326 [PG_LATIN9] = DEF_ENC2NAME(LATIN9, 28605),
330 [PG_WIN866] = DEF_ENC2NAME(WIN866, 866),
331 [PG_WIN874] = DEF_ENC2NAME(WIN874, 874),
332 [PG_KOI8R] = DEF_ENC2NAME(KOI8R, 20866),
344 [PG_KOI8U] = DEF_ENC2NAME(KOI8U, 21866),
345 [PG_SJIS] = DEF_ENC2NAME(SJIS, 932),
346 [PG_BIG5] = DEF_ENC2NAME(BIG5, 950),
347 [PG_GBK] = DEF_ENC2NAME(GBK, 936),
348 [PG_UHC] = DEF_ENC2NAME(UHC, 949),
349 [PG_GB18030] = DEF_ENC2NAME(GB18030, 54936),
352};
#define DEF_ENC2NAME(name, codepage)
Definition encnames.c:303

Referenced by check_encoding_conversion_args(), InitializeClientEncoding(), pg_any_to_server(), pg_encoding_to_char(), pg_unicode_to_server(), report_invalid_encoding(), report_untranslatable_char(), SetClientEncoding(), SetDatabaseEncoding(), SetMessageEncoding(), and test_enc_setup().

◆ pg_encname_tbl

const pg_encname pg_encname_tbl[]
static

Definition at line 39 of file encnames.c.

40{
41 {
42 "abc", PG_WIN1258
43 }, /* alias for WIN1258 */
44 {
45 "alt", PG_WIN866
46 }, /* IBM866 */
47 {
48 "big5", PG_BIG5
49 }, /* Big5; Chinese for Taiwan multibyte set */
50 {
51 "euccn", PG_EUC_CN
52 }, /* EUC-CN; Extended Unix Code for simplified
53 * Chinese */
54 {
55 "eucjis2004", PG_EUC_JIS_2004
56 }, /* EUC-JIS-2004; Extended UNIX Code fixed
57 * Width for Japanese, standard JIS X 0213 */
58 {
59 "eucjp", PG_EUC_JP
60 }, /* EUC-JP; Extended UNIX Code fixed Width for
61 * Japanese, standard OSF */
62 {
63 "euckr", PG_EUC_KR
64 }, /* EUC-KR; Extended Unix Code for Korean , KS
65 * X 1001 standard */
66 {
67 "euctw", PG_EUC_TW
68 }, /* EUC-TW; Extended Unix Code for
69 *
70 * traditional Chinese */
71 {
72 "gb18030", PG_GB18030
73 }, /* GB18030;GB18030 */
74 {
75 "gbk", PG_GBK
76 }, /* GBK; Chinese Windows CodePage 936
77 * simplified Chinese */
78 {
79 "iso88591", PG_LATIN1
80 }, /* ISO-8859-1; RFC1345,KXS2 */
81 {
82 "iso885910", PG_LATIN6
83 }, /* ISO-8859-10; RFC1345,KXS2 */
84 {
85 "iso885913", PG_LATIN7
86 }, /* ISO-8859-13; RFC1345,KXS2 */
87 {
88 "iso885914", PG_LATIN8
89 }, /* ISO-8859-14; RFC1345,KXS2 */
90 {
91 "iso885915", PG_LATIN9
92 }, /* ISO-8859-15; RFC1345,KXS2 */
93 {
94 "iso885916", PG_LATIN10
95 }, /* ISO-8859-16; RFC1345,KXS2 */
96 {
97 "iso88592", PG_LATIN2
98 }, /* ISO-8859-2; RFC1345,KXS2 */
99 {
100 "iso88593", PG_LATIN3
101 }, /* ISO-8859-3; RFC1345,KXS2 */
102 {
103 "iso88594", PG_LATIN4
104 }, /* ISO-8859-4; RFC1345,KXS2 */
105 {
106 "iso88595", PG_ISO_8859_5
107 }, /* ISO-8859-5; RFC1345,KXS2 */
108 {
109 "iso88596", PG_ISO_8859_6
110 }, /* ISO-8859-6; RFC1345,KXS2 */
111 {
112 "iso88597", PG_ISO_8859_7
113 }, /* ISO-8859-7; RFC1345,KXS2 */
114 {
115 "iso88598", PG_ISO_8859_8
116 }, /* ISO-8859-8; RFC1345,KXS2 */
117 {
118 "iso88599", PG_LATIN5
119 }, /* ISO-8859-9; RFC1345,KXS2 */
120 {
121 "johab", PG_JOHAB
122 }, /* JOHAB; Extended Unix Code for simplified
123 * Chinese */
124 {
125 "koi8", PG_KOI8R
126 }, /* _dirty_ alias for KOI8-R (backward
127 * compatibility) */
128 {
129 "koi8r", PG_KOI8R
130 }, /* KOI8-R; RFC1489 */
131 {
132 "koi8u", PG_KOI8U
133 }, /* KOI8-U; RFC2319 */
134 {
135 "latin1", PG_LATIN1
136 }, /* alias for ISO-8859-1 */
137 {
138 "latin10", PG_LATIN10
139 }, /* alias for ISO-8859-16 */
140 {
141 "latin2", PG_LATIN2
142 }, /* alias for ISO-8859-2 */
143 {
144 "latin3", PG_LATIN3
145 }, /* alias for ISO-8859-3 */
146 {
147 "latin4", PG_LATIN4
148 }, /* alias for ISO-8859-4 */
149 {
150 "latin5", PG_LATIN5
151 }, /* alias for ISO-8859-9 */
152 {
153 "latin6", PG_LATIN6
154 }, /* alias for ISO-8859-10 */
155 {
156 "latin7", PG_LATIN7
157 }, /* alias for ISO-8859-13 */
158 {
159 "latin8", PG_LATIN8
160 }, /* alias for ISO-8859-14 */
161 {
162 "latin9", PG_LATIN9
163 }, /* alias for ISO-8859-15 */
164 {
165 "mskanji", PG_SJIS
166 }, /* alias for Shift_JIS */
167 {
168 "muleinternal", PG_MULE_INTERNAL
169 },
170 {
171 "shiftjis", PG_SJIS
172 }, /* Shift_JIS; JIS X 0202-1991 */
173
174 {
175 "shiftjis2004", PG_SHIFT_JIS_2004
176 }, /* SHIFT-JIS-2004; Shift JIS for Japanese,
177 * standard JIS X 0213 */
178 {
179 "sjis", PG_SJIS
180 }, /* alias for Shift_JIS */
181 {
182 "sqlascii", PG_SQL_ASCII
183 },
184 {
185 "tcvn", PG_WIN1258
186 }, /* alias for WIN1258 */
187 {
188 "tcvn5712", PG_WIN1258
189 }, /* alias for WIN1258 */
190 {
191 "uhc", PG_UHC
192 }, /* UHC; Korean Windows CodePage 949 */
193 {
194 "unicode", PG_UTF8
195 }, /* alias for UTF8 */
196 {
197 "utf8", PG_UTF8
198 }, /* alias for UTF8 */
199 {
200 "vscii", PG_WIN1258
201 }, /* alias for WIN1258 */
202 {
203 "win", PG_WIN1251
204 }, /* _dirty_ alias for windows-1251 (backward
205 * compatibility) */
206 {
207 "win1250", PG_WIN1250
208 }, /* alias for Windows-1250 */
209 {
210 "win1251", PG_WIN1251
211 }, /* alias for Windows-1251 */
212 {
213 "win1252", PG_WIN1252
214 }, /* alias for Windows-1252 */
215 {
216 "win1253", PG_WIN1253
217 }, /* alias for Windows-1253 */
218 {
219 "win1254", PG_WIN1254
220 }, /* alias for Windows-1254 */
221 {
222 "win1255", PG_WIN1255
223 }, /* alias for Windows-1255 */
224 {
225 "win1256", PG_WIN1256
226 }, /* alias for Windows-1256 */
227 {
228 "win1257", PG_WIN1257
229 }, /* alias for Windows-1257 */
230 {
231 "win1258", PG_WIN1258
232 }, /* alias for Windows-1258 */
233 {
234 "win866", PG_WIN866
235 }, /* IBM866 */
236 {
237 "win874", PG_WIN874
238 }, /* alias for Windows-874 */
239 {
240 "win932", PG_SJIS
241 }, /* alias for Shift_JIS */
242 {
243 "win936", PG_GBK
244 }, /* alias for GBK */
245 {
246 "win949", PG_UHC
247 }, /* alias for UHC */
248 {
249 "win950", PG_BIG5
250 }, /* alias for BIG5 */
251 {
252 "windows1250", PG_WIN1250
253 }, /* Windows-1251; Microsoft */
254 {
255 "windows1251", PG_WIN1251
256 }, /* Windows-1251; Microsoft */
257 {
258 "windows1252", PG_WIN1252
259 }, /* Windows-1252; Microsoft */
260 {
261 "windows1253", PG_WIN1253
262 }, /* Windows-1253; Microsoft */
263 {
264 "windows1254", PG_WIN1254
265 }, /* Windows-1254; Microsoft */
266 {
267 "windows1255", PG_WIN1255
268 }, /* Windows-1255; Microsoft */
269 {
270 "windows1256", PG_WIN1256
271 }, /* Windows-1256; Microsoft */
272 {
273 "windows1257", PG_WIN1257
274 }, /* Windows-1257; Microsoft */
275 {
276 "windows1258", PG_WIN1258
277 }, /* Windows-1258; Microsoft */
278 {
279 "windows866", PG_WIN866
280 }, /* IBM866 */
281 {
282 "windows874", PG_WIN874
283 }, /* Windows-874; Microsoft */
284 {
285 "windows932", PG_SJIS
286 }, /* alias for Shift_JIS */
287 {
288 "windows936", PG_GBK
289 }, /* alias for GBK */
290 {
291 "windows949", PG_UHC
292 }, /* alias for UHC */
293 {
294 "windows950", PG_BIG5
295 } /* alias for BIG5 */
296};

Referenced by pg_char_to_encoding().