PostgreSQL Source Code git master
Loading...
Searching...
No Matches
string_utils.c File Reference
#include "postgres_fe.h"
#include <ctype.h>
#include "common/keywords.h"
#include "fe_utils/string_utils.h"
#include "mb/pg_wchar.h"
Include dependency graph for string_utils.c:

Go to the source code of this file.

Macros

#define WHEREAND()
 

Functions

static PQExpBuffer defaultGetLocalPQExpBuffer (void)
 
void setFmtEncoding (int encoding)
 
static int getFmtEncoding (void)
 
const char * fmtIdEnc (const char *rawid, int encoding)
 
const char * fmtId (const char *rawid)
 
const char * fmtQualifiedIdEnc (const char *schema, const char *id, int encoding)
 
const char * fmtQualifiedId (const char *schema, const char *id)
 
char * formatPGVersionNumber (int version_number, bool include_minor, char *buf, size_t buflen)
 
void appendStringLiteral (PQExpBuffer buf, const char *str, int encoding, bool std_strings)
 
void appendStringLiteralConn (PQExpBuffer buf, const char *str, PGconn *conn)
 
void appendStringLiteralDQ (PQExpBuffer buf, const char *str, const char *dqprefix)
 
void appendByteaLiteral (PQExpBuffer buf, const unsigned char *str, size_t length, bool std_strings)
 
void appendShellString (PQExpBuffer buf, const char *str)
 
bool appendShellStringNoError (PQExpBuffer buf, const char *str)
 
void appendConnStrVal (PQExpBuffer buf, const char *str)
 
void appendPsqlMetaConnect (PQExpBuffer buf, const char *dbname)
 
bool parsePGArray (const char *atext, char ***itemarray, int *nitems)
 
void appendPGArray (PQExpBuffer buffer, const char *value)
 
bool appendReloptionsArray (PQExpBuffer buffer, const char *reloptions, const char *prefix, int encoding, bool std_strings)
 
bool processSQLNamePattern (PGconn *conn, PQExpBuffer buf, const char *pattern, bool have_where, bool force_escape, const char *schemavar, const char *namevar, const char *altnamevar, const char *visibilityrule, PQExpBuffer dbnamebuf, int *dotcnt)
 
void patternToSQLRegex (int encoding, PQExpBuffer dbnamebuf, PQExpBuffer schemabuf, PQExpBuffer namebuf, const char *pattern, bool force_escape, bool want_literal_dbname, int *dotcnt)
 

Variables

int quote_all_identifiers = 0
 
PQExpBuffer(* getLocalPQExpBuffer )(void)
 

Macro Definition Documentation

◆ WHEREAND

#define WHEREAND ( )
Value:
(appendPQExpBufferStr(buf, have_where ? " AND " : "WHERE "), \
return true
Definition isn.c:130
static char buf[DEFAULT_XLOG_SEG_SIZE]
void appendPQExpBufferStr(PQExpBuffer str, const char *data)
static int fb(int x)

Function Documentation

◆ appendByteaLiteral()

void appendByteaLiteral ( PQExpBuffer  buf,
const unsigned char * str,
size_t  length,
bool  std_strings 
)

Definition at line 527 of file string_utils.c.

/*
 * appendByteaLiteral: append the "length" bytes starting at "str" to "buf"
 * as one single-quoted, hex-format literal: a quote, a backslash (doubled
 * when std_strings is false), 'x', two lowercase hex digits per input byte,
 * and a closing quote.
 *
 * If enlargePQExpBuffer() reports failure, nothing is appended and the
 * function returns silently; there is no error return.
 */
529{
530 const unsigned char *source = str;
531 char *target;
532
533 static const char hextbl[] = "0123456789abcdef";
534
535 /*
536 * This implementation is hard-wired to produce hex-format output. We do
537 * not know the server version the output will be loaded into, so making
538 * an intelligent format choice is impossible. It might be better to
539 * always use the old escaped format.
540 */
/*
 * Space request: 2 hex digits per byte, plus 5 for the opening quote, up to
 * two backslashes, the 'x' and the closing quote.  The terminating NUL
 * written below is not part of that count -- presumably
 * enlargePQExpBuffer() reserves it itself; confirm against pqexpbuffer.c.
 */
541 if (!enlargePQExpBuffer(buf, 2 * length + 5))
542 return;
543
/* Write directly past the current end of the buffer's contents. */
544 target = buf->data + buf->len;
545 *target++ = '\'';
/* Without std_strings, emit a second backslash in front of the 'x'. */
546 if (!std_strings)
547 *target++ = '\\';
548 *target++ = '\\';
549 *target++ = 'x';
550
/* High nibble first, then low nibble, for every input byte. */
551 while (length-- > 0)
552 {
553 unsigned char c = *source++;
554
555 *target++ = hextbl[(c >> 4) & 0xF];
556 *target++ = hextbl[c & 0xF];
557 }
558
559 /* Write the terminating quote and NUL character. */
560 *target++ = '\'';
561 *target = '\0';
562
/* target points at the NUL, so the new length excludes the terminator. */
563 buf->len = target - buf->data;
564}
const char * str
static rewind_source * source
Definition pg_rewind.c:89
static const char hextbl[]
Definition pgp-info.c:87
int enlargePQExpBuffer(PQExpBuffer str, size_t needed)
char * c

References buf, enlargePQExpBuffer(), hextbl, source, and str.

◆ appendConnStrVal()

void appendConnStrVal ( PQExpBuffer  buf,
const char * str 
)

Definition at line 696 of file string_utils.c.

697{
698 const char *s;
699 bool needquotes;
700
701 /*
702 * If the string is one or more plain ASCII characters, no need to quote
703 * it. This is quite conservative, but better safe than sorry.
704 */
705 needquotes = true;
706 for (s = str; *s; s++)
707 {
708 if (!((*s >= 'a' && *s <= 'z') || (*s >= 'A' && *s <= 'Z') ||
709 (*s >= '0' && *s <= '9') || *s == '_' || *s == '.'))
710 {
711 needquotes = true;
712 break;
713 }
714 needquotes = false;
715 }
716
717 if (needquotes)
718 {
720 while (*str)
721 {
722 /* ' and \ must be escaped to \' and \\ */
723 if (*str == '\'' || *str == '\\')
725
727 str++;
728 }
730 }
731 else
733}
void appendPQExpBufferChar(PQExpBuffer str, char ch)

References appendPQExpBufferChar(), appendPQExpBufferStr(), buf, fb(), and str.

Referenced by appendConnStrItem(), appendPsqlMetaConnect(), constructConnStr(), generate_old_dump(), GenerateRecoveryConfig(), get_db_conn(), runPgDump(), and start_conn().

◆ appendPGArray()

void appendPGArray ( PQExpBuffer  buffer,
const char * value 
)

Definition at line 900 of file string_utils.c.

/*
 * appendPGArray: append one element, "value", to an array literal that is
 * being built up in "buffer".
 *
 * A ',' separator is emitted first unless the last character already in the
 * buffer is '{'.  The element is double-quoted when it is empty, when it
 * equals "NULL" ignoring case, or when it contains a double quote,
 * backslash, brace, comma or one of the listed whitespace characters.
 * Inside the quoted form, each '"' and '\' is preceded by a backslash.
 *
 * NOTE(review): the first test reads buffer->data[buffer->len - 1], so the
 * buffer must not be empty on entry -- presumably callers append the
 * opening '{' themselves before the first element; confirm at call sites.
 */
901{
902 bool needquote;
903 const char *tmp;
904
/* Anything other than a fresh '{' means an earlier element exists. */
905 if (buffer->data[buffer->len - 1] != '{')
906 appendPQExpBufferChar(buffer, ',');
907
908 /* Decide if we need quotes; this should match array_out()'s choices. */
909 if (value[0] == '\0')
910 needquote = true; /* force quotes for empty string */
911 else if (pg_strcasecmp(value, "NULL") == 0)
912 needquote = true; /* force quotes for literal NULL */
913 else
914 needquote = false;
915
/* Not forced yet: scan for any character that makes quoting necessary. */
916 if (!needquote)
917 {
918 for (tmp = value; *tmp; tmp++)
919 {
920 char ch = *tmp;
921
922 if (ch == '"' || ch == '\\' ||
923 ch == '{' || ch == '}' || ch == ',' ||
924 /* these match scanner_isspace(): */
925 ch == ' ' || ch == '\t' || ch == '\n' ||
926 ch == '\r' || ch == '\v' || ch == '\f')
927 {
928 needquote = true;
929 break;
930 }
931 }
932 }
933
934 if (needquote)
935 {
/* Quoted form: only '"' and '\' get a backslash; the rest is copied as-is. */
936 appendPQExpBufferChar(buffer, '"');
937 for (tmp = value; *tmp; tmp++)
938 {
939 char ch = *tmp;
940
941 if (ch == '"' || ch == '\\')
942 appendPQExpBufferChar(buffer, '\\');
943 appendPQExpBufferChar(buffer, ch);
944 }
945 appendPQExpBufferChar(buffer, '"');
946 }
947 else
/* NOTE(review): listing line 948, the body of this else branch, is missing from this extract. */
949}
static struct @175 value
int pg_strcasecmp(const char *s1, const char *s2)

References appendPQExpBufferChar(), appendPQExpBufferStr(), PQExpBufferData::data, fb(), PQExpBufferData::len, pg_strcasecmp(), and value.

Referenced by fetchAttributeStats(), and getNamespaces().

◆ appendPsqlMetaConnect()

void appendPsqlMetaConnect ( PQExpBuffer  buf,
const char * dbname 
)

Definition at line 741 of file string_utils.c.

742{
743 const char *s;
744 bool complex;
745
746 /*
747 * If the name is plain ASCII characters, emit a trivial "\connect "foo"".
748 * For other names, even many not technically requiring it, skip to the
749 * general case. No database has a zero-length name.
750 */
751 complex = false;
752
753 for (s = dbname; *s; s++)
754 {
755 if (*s == '\n' || *s == '\r')
756 {
758 _("database name contains a newline or carriage return: \"%s\"\n"),
759 dbname);
761 }
762
763 if (!((*s >= 'a' && *s <= 'z') || (*s >= 'A' && *s <= 'Z') ||
764 (*s >= '0' && *s <= '9') || *s == '_' || *s == '.'))
765 {
766 complex = true;
767 }
768 }
769
770 if (complex)
771 {
773
775
776 /*
777 * Force the target psql's encoding to SQL_ASCII. We don't really
778 * know the encoding of the database name, and it doesn't matter as
779 * long as psql will forward it to the server unchanged.
780 */
781 appendPQExpBufferStr(buf, "\\encoding SQL_ASCII\n");
782 appendPQExpBufferStr(buf, "\\connect -reuse-previous=on ");
783
784 appendPQExpBufferStr(&connstr, "dbname=");
786
787 /*
788 * As long as the name does not contain a newline, SQL identifier
789 * quoting satisfies the psql meta-command parser. Prefer not to
790 * involve psql-interpreted single quotes, which behaved differently
791 * before PostgreSQL 9.2.
792 */
794
796 }
797 else
798 {
799 appendPQExpBufferStr(buf, "\\connect ");
801 }
803}
#define fprintf(file, fmt, msg)
Definition cubescan.l:21
#define _(x)
Definition elog.c:96
static const char * connstr
Definition pg_dumpall.c:82
@ PG_SQL_ASCII
Definition pg_wchar.h:76
void initPQExpBuffer(PQExpBuffer str)
Definition pqexpbuffer.c:90
void termPQExpBuffer(PQExpBuffer str)
#define EXIT_FAILURE
Definition settings.h:197
char * dbname
Definition streamutil.c:49
const char * fmtIdEnc(const char *rawid, int encoding)
void appendConnStrVal(PQExpBuffer buf, const char *str)

References _, appendConnStrVal(), appendPQExpBufferChar(), appendPQExpBufferStr(), buf, connstr, dbname, EXIT_FAILURE, fb(), fmtIdEnc(), fprintf, initPQExpBuffer(), PG_SQL_ASCII, and termPQExpBuffer().

Referenced by _reconnectToDB(), old_9_6_invalidate_hash_indexes(), and process_extension_updates().

◆ appendReloptionsArray()

bool appendReloptionsArray ( PQExpBuffer  buffer,
const char * reloptions,
const char * prefix,
int  encoding,
bool  std_strings 
)

Definition at line 964 of file string_utils.c.

/*
 * appendReloptionsArray: parse the array text "reloptions" with
 * parsePGArray() and append its elements to "buffer" as a ", "-separated
 * list in which each item is written as prefix, then the name passed
 * through fmtId(), then '=', then the value.
 *
 * The value is appended bare when fmtId() returns it unchanged; otherwise
 * it is appended through appendStringLiteral() using "encoding" and
 * "std_strings".
 *
 * Returns false if parsePGArray() rejects the input (nothing is appended in
 * that case), true otherwise.
 */
966{
967 char **options;
968 int noptions;
969 int i;
970
971 if (!parsePGArray(reloptions, &options, &noptions))
972 {
/*
 * parsePGArray() stores either NULL or its allocated block in options
 * before it can fail, so this free() is needed on the failure path too.
 */
973 free(options);
974 return false;
975 }
976
977 for (i = 0; i < noptions; i++)
978 {
979 char *option = options[i];
980 char *name;
981 char *separator;
982 char *value;
983
984 /*
985 * Each array element should have the form name=value. If the "=" is
986 * missing for some reason, treat it like an empty value.
987 */
988 name = option;
989 separator = strchr(option, '=');
990 if (separator)
991 {
/* Split in place: the '=' becomes the NUL that terminates the name. */
992 *separator = '\0';
993 value = separator + 1;
994 }
995 else
996 value = "";
997
998 if (i > 0)
999 appendPQExpBufferStr(buffer, ", ");
1000 appendPQExpBuffer(buffer, "%s%s=", prefix, fmtId(name));
1001
1002 /*
1003 * In general we need to quote the value; but to avoid unnecessary
1004 * clutter, do not quote if it is an identifier that would not need
1005 * quoting. (We could also allow numbers, but that is a bit trickier
1006 * than it looks --- for example, are leading zeroes significant? We
1007 * don't want to assume very much here about what custom reloptions
1008 * might mean.)
1009 */
1010 if (strcmp(fmtId(value), value) == 0)
1011 appendPQExpBufferStr(buffer, value);
1012 else
1013 appendStringLiteral(buffer, value, encoding, std_strings);
1014 }
1015
/* One free() is all that is done here; the element strings are not freed individually. */
1016 free(options);
1017
1018 return true;
1019}
static char * encoding
Definition initdb.c:139
int i
Definition isn.c:77
static size_t noptions
void appendPQExpBuffer(PQExpBuffer str, const char *fmt,...)
#define free(a)
const char * fmtId(const char *rawid)
bool parsePGArray(const char *atext, char ***itemarray, int *nitems)
void appendStringLiteral(PQExpBuffer buf, const char *str, int encoding, bool std_strings)
const char * name

References appendPQExpBuffer(), appendPQExpBufferStr(), appendStringLiteral(), encoding, fb(), fmtId(), free, i, name, noptions, parsePGArray(), and value.

Referenced by appendReloptionsArrayAH(), and get_create_object_cmd().

◆ appendShellString()

void appendShellString ( PQExpBuffer  buf,
const char * str 
)

Definition at line 580 of file string_utils.c.

581{
583 {
585 _("shell command argument contains a newline or carriage return: \"%s\"\n"),
586 str);
588 }
589}
bool appendShellStringNoError(PQExpBuffer buf, const char *str)

References _, appendShellStringNoError(), buf, EXIT_FAILURE, fb(), fprintf, and str.

Referenced by cluster_conn_opts(), ensureCleanShutdown(), generate_old_dump(), getRestoreCommand(), main(), output_completion_banner(), runPgDump(), start_standby_server(), and test_specific_config_settings().

◆ appendShellStringNoError()

bool appendShellStringNoError ( PQExpBuffer  buf,
const char * str 
)

Definition at line 592 of file string_utils.c.

593{
594#ifdef WIN32
595 int backslash_run_length = 0;
596#endif
597 bool ok = true;
598 const char *p;
599
600 /*
601 * Don't bother with adding quotes if the string is nonempty and clearly
602 * contains only safe characters.
603 */
604 if (*str != '\0' &&
605 strspn(str, "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-_./:") == strlen(str))
606 {
608 return ok;
609 }
610
611#ifndef WIN32
613 for (p = str; *p; p++)
614 {
615 if (*p == '\n' || *p == '\r')
616 {
617 ok = false;
618 continue;
619 }
620
621 if (*p == '\'')
622 appendPQExpBufferStr(buf, "'\"'\"'");
623 else
625 }
627#else /* WIN32 */
628
629 /*
630 * A Windows system() argument experiences two layers of interpretation.
631 * First, cmd.exe interprets the string. Its behavior is undocumented,
632 * but a caret escapes any byte except LF or CR that would otherwise have
633 * special meaning. Handling of a caret before LF or CR differs between
634 * "cmd.exe /c" and other modes, and it is unusable here.
635 *
636 * Second, the new process parses its command line to construct argv (see
637 * https://msdn.microsoft.com/en-us/library/17w5ykft.aspx). This treats
638 * backslash-double quote sequences specially.
639 */
641 for (p = str; *p; p++)
642 {
643 if (*p == '\n' || *p == '\r')
644 {
645 ok = false;
646 continue;
647 }
648
649 /* Change N backslashes before a double quote to 2N+1 backslashes. */
650 if (*p == '"')
651 {
653 {
656 }
658 }
659 else if (*p == '\\')
661 else
663
664 /*
665 * Decline to caret-escape the most mundane characters, to ease
666 * debugging and lest we approach the command length limit.
667 */
668 if (!((*p >= 'a' && *p <= 'z') ||
669 (*p >= 'A' && *p <= 'Z') ||
670 (*p >= '0' && *p <= '9')))
673 }
674
675 /*
676 * Change N backslashes at end of argument to 2N backslashes, because they
677 * precede the double quote that terminates the argument.
678 */
680 {
683 }
685#endif /* WIN32 */
686
687 return ok;
688}

References appendPQExpBufferChar(), appendPQExpBufferStr(), buf, fb(), and str.

Referenced by appendShellString(), and psql_get_variable().

◆ appendStringLiteral()

void appendStringLiteral ( PQExpBuffer  buf,
const char * str,
int  encoding,
bool  std_strings 
)

Definition at line 351 of file string_utils.c.

353{
354 size_t length = strlen(str);
355 const char *source = str;
356 char *target;
357 size_t remaining = length;
358
359 if (!enlargePQExpBuffer(buf, 2 * length + 2))
360 return;
361
362 target = buf->data + buf->len;
363 *target++ = '\'';
364
365 while (remaining > 0)
366 {
367 char c = *source;
368 int charlen;
369 int i;
370
371 /* Fast path for plain ASCII */
372 if (!IS_HIGHBIT_SET(c))
373 {
374 /* Apply quoting if needed */
375 if (SQL_STR_DOUBLE(c, !std_strings))
376 *target++ = c;
377 /* Copy the character */
378 *target++ = c;
379 source++;
380 remaining--;
381 continue;
382 }
383
384 /* Slow path for possible multibyte characters */
385 charlen = PQmblen(source, encoding);
386
387 if (remaining < charlen ||
389 {
390 /*
391 * Multibyte character is invalid. It's important to verify that
392 * as invalid multibyte characters could e.g. be used to "skip"
393 * over quote characters, e.g. when parsing
394 * character-by-character.
395 *
396 * Replace the character's first byte with an invalid sequence.
397 * The invalid sequence ensures that the escaped string will
398 * trigger an error on the server-side, even if we can't directly
399 * report an error here.
400 *
401 * We know there's enough space for the invalid sequence because
402 * the "target" buffer is 2 * length + 2 long, and at worst we're
403 * replacing a single input byte with two invalid bytes.
404 *
405 * It would be a bit faster to verify the whole string the first
406 * time we encounter a set highbit, but this way we can replace
407 * just the invalid data, which probably makes it easier for users
408 * to find the invalidly encoded portion of a larger string.
409 */
411 target += 2;
412
413 /*
414 * Handle the following bytes as if this byte didn't exist. That's
415 * safer in case the subsequent bytes contain important characters
416 * for the caller (e.g. '>' in html).
417 */
418 source++;
419 remaining--;
420 }
421 else
422 {
423 /* Copy the character */
424 for (i = 0; i < charlen; i++)
425 {
426 *target++ = *source++;
427 remaining--;
428 }
429 }
430 }
431
432 /* Write the terminating quote and NUL character. */
433 *target++ = '\'';
434 *target = '\0';
435
436 buf->len = target - buf->data;
437}
#define IS_HIGHBIT_SET(ch)
Definition c.h:1300
#define SQL_STR_DOUBLE(ch, escape_backslash)
Definition c.h:1308
int PQmblen(const char *s, int encoding)
Definition fe-misc.c:1255
int remaining
Definition informix.c:692
void pg_encoding_set_invalid(int encoding, char *dst)
Definition wchar.c:1852
int pg_encoding_verifymbchar(int encoding, const char *mbstr, int len)
Definition wchar.c:1989

References buf, encoding, enlargePQExpBuffer(), fb(), i, IS_HIGHBIT_SET, pg_encoding_set_invalid(), pg_encoding_verifymbchar(), PQmblen(), remaining, source, SQL_STR_DOUBLE, and str.

Referenced by appendReloptionsArray(), appendStringLiteralConn(), and escape_append_literal().

◆ appendStringLiteralConn()

void appendStringLiteralConn ( PQExpBuffer  buf,
const char * str,
PGconn * conn 
)

Definition at line 446 of file string_utils.c.

447{
448 size_t length = strlen(str);
449
450 /*
451 * XXX This is a kluge to silence escape_string_warning in our utility
452 * programs. It can go away once pre-v19 servers are out of support.
453 */
454 if (strchr(str, '\\') != NULL && PQserverVersion(conn) < 190000)
455 {
456 /* ensure we are not adjacent to an identifier */
457 if (buf->len > 0 && buf->data[buf->len - 1] != ' ')
461 return;
462 }
463 /* XXX end kluge */
464
465 if (!enlargePQExpBuffer(buf, 2 * length + 2))
466 return;
468 buf->len += PQescapeStringConn(conn, buf->data + buf->len,
469 str, length, NULL);
471}
#define ESCAPE_STRING_SYNTAX
Definition c.h:1311
int PQserverVersion(const PGconn *conn)
int PQclientEncoding(const PGconn *conn)
size_t PQescapeStringConn(PGconn *conn, char *to, const char *from, size_t length, int *error)
Definition fe-exec.c:4213
PGconn * conn
Definition streamutil.c:52

References appendPQExpBufferChar(), appendStringLiteral(), buf, conn, enlargePQExpBuffer(), ESCAPE_STRING_SYNTAX, fb(), PQclientEncoding(), PQescapeStringConn(), PQserverVersion(), and str.

Referenced by append_db_pattern_cte(), append_rel_pattern_filtered_cte(), append_rel_pattern_raw_cte(), appendQualifiedRelation(), create_logical_replication_slots(), dumpRoles(), dumpTablespaces(), dumpUserConfig(), emitShSecLabels(), get_parallel_tables_list(), getTables(), lookup_object_oid(), main(), makeAlterConfigCommand(), processSQLNamePattern(), retrieve_objects(), and setup_connection().

◆ appendStringLiteralDQ()

void appendStringLiteralDQ ( PQExpBuffer  buf,
const char * str,
const char * dqprefix 
)

Definition at line 484 of file string_utils.c.

485{
486 static const char suffixes[] = "_XXXXXXX";
487 int nextchar = 0;
489
490 /* start with $ + dqprefix if not NULL */
492 if (dqprefix)
494
495 /*
496 * Make sure we choose a delimiter which (without the trailing $) is not
497 * present in the string being quoted. We don't check with the trailing $
498 * because a string ending in $foo must not be quoted with $foo$.
499 */
500 while (strstr(str, delimBuf->data) != NULL)
501 {
503 nextchar %= sizeof(suffixes) - 1;
504 }
505
506 /* add trailing $ */
508
509 /* quote it and we are all done */
513
515}
PQExpBuffer createPQExpBuffer(void)
Definition pqexpbuffer.c:72
void destroyPQExpBuffer(PQExpBuffer str)

References appendPQExpBufferChar(), appendPQExpBufferStr(), buf, createPQExpBuffer(), destroyPQExpBuffer(), fb(), and str.

Referenced by dumpFunc().

◆ defaultGetLocalPQExpBuffer()

static PQExpBuffer defaultGetLocalPQExpBuffer ( void  )
static

◆ fmtId()

const char * fmtId ( const char * rawid)

Definition at line 248 of file string_utils.c.

/*
 * fmtId: convenience wrapper around fmtIdEnc() that supplies the encoding
 * returned by getFmtEncoding() and passes the result through unchanged.
 */
249{
250 return fmtIdEnc(rawid, getFmtEncoding());
251}
static int getFmtEncoding(void)

References fb(), fmtIdEnc(), and getFmtEncoding().

Referenced by _doSetFixedOutputState(), _getObjectDescription(), _printTableAccessMethodNoStorage(), _printTocEntry(), _selectOutputSchema(), _selectTableAccessMethod(), _selectTablespace(), append_depends_on_extension(), appendReloptionsArray(), binary_upgrade_extension_member(), buildACLCommands(), buildDefaultACLCommands(), createDummyViewAsClause(), describeOneTableDetails(), dropDBs(), dropRoles(), dropTablespaces(), dumpAccessMethod(), dumpAgg(), dumpAttrDef(), dumpBaseType(), dumpCast(), dumpCollation(), dumpCommentExtended(), dumpCompositeType(), dumpCompositeTypeColComments(), dumpConstraint(), dumpConversion(), dumpDatabase(), dumpDomain(), dumpEnumType(), dumpEventTrigger(), dumpExtension(), dumpForeignDataWrapper(), dumpForeignServer(), dumpFunc(), dumpIndex(), dumpNamespace(), dumpOpclass(), dumpOpfamily(), dumpOpr(), dumpPolicy(), dumpProcLang(), dumpPublication(), dumpPublicationNamespace(), dumpPublicationTable(), dumpRangeType(), dumpRoleGUCPrivs(), dumpRoleMembership(), dumpRoles(), dumpRule(), dumpSearchPath(), dumpSecLabel(), dumpSequence(), dumpStatisticsExt(), dumpSubscription(), dumpTable(), dumpTableComment(), dumpTableConstraintComment(), dumpTableData_insert(), dumpTableSchema(), dumpTableSecLabel(), dumpTablespaces(), dumpTransform(), dumpTrigger(), dumpTSConfig(), dumpTSDictionary(), dumpTSParser(), dumpTSTemplate(), dumpUndefinedType(), dumpUserMappings(), emitShSecLabels(), escape_fmt_id(), fmtCopyColumnList(), format_aggregate_signature(), format_function_arguments(), format_function_signature(), get_create_object_cmd(), get_language_name(), getFormattedOperatorName(), getPublicationTables(), main(), makeAlterConfigCommand(), and setup_connection().

◆ fmtIdEnc()

const char * fmtIdEnc ( const char * rawid,
int  encoding 
)

Definition at line 101 of file string_utils.c.

102{
104
105 const char *cp;
106 bool need_quotes = false;
107 size_t remaining = strlen(rawid);
108
109 /*
110 * These checks need to match the identifier production in scan.l. Don't
111 * use islower() etc.
112 */
114 need_quotes = true;
115 /* slightly different rules for first character */
116 else if (!((rawid[0] >= 'a' && rawid[0] <= 'z') || rawid[0] == '_'))
117 need_quotes = true;
118 else
119 {
120 /* otherwise check the entire string */
121 cp = rawid;
122 for (size_t i = 0; i < remaining; i++, cp++)
123 {
124 if (!((*cp >= 'a' && *cp <= 'z')
125 || (*cp >= '0' && *cp <= '9')
126 || (*cp == '_')))
127 {
128 need_quotes = true;
129 break;
130 }
131 }
132 }
133
134 if (!need_quotes)
135 {
136 /*
137 * Check for keyword. We quote keywords except for unreserved ones.
138 * (In some cases we could avoid quoting a col_name or type_func_name
139 * keyword, but it seems much harder than it's worth to tell that.)
140 *
141 * Note: ScanKeywordLookup() does case-insensitive comparison, but
142 * that's fine, since we already know we have all-lower-case.
143 */
145
147 need_quotes = true;
148 }
149
150 if (!need_quotes)
151 {
152 /* no quoting needed */
154 }
155 else
156 {
158
159 cp = &rawid[0];
160 while (remaining > 0)
161 {
162 int charlen;
163
164 /* Fast path for plain ASCII */
165 if (!IS_HIGHBIT_SET(*cp))
166 {
167 /*
168 * Did we find a double-quote in the string? Then make this a
169 * double double-quote per SQL99. Before, we put in a
170 * backslash/double-quote pair. - thomas 2000-08-05
171 */
172 if (*cp == '"')
175 remaining--;
176 cp++;
177 continue;
178 }
179
180 /* Slow path for possible multibyte characters */
181 charlen = pg_encoding_mblen(encoding, cp);
182
183 if (remaining < charlen ||
184 pg_encoding_verifymbchar(encoding, cp, charlen) == -1)
185 {
186 /*
187 * Multibyte character is invalid. It's important to verify
188 * that as invalid multibyte characters could e.g. be used to
189 * "skip" over quote characters, e.g. when parsing
190 * character-by-character.
191 *
192 * Replace the character's first byte with an invalid
193 * sequence. The invalid sequence ensures that the escaped
194 * string will trigger an error on the server-side, even if we
195 * can't directly report an error here.
196 *
197 * It would be a bit faster to verify the whole string the
198 * first time we encounter a set highbit, but this way we can
199 * replace just the invalid data, which probably makes it
200 * easier for users to find the invalidly encoded portion of a
201 * larger string.
202 */
204 {
206 id_return->data + id_return->len);
207 id_return->len += 2;
208 id_return->data[id_return->len] = '\0';
209 }
210
211 /*
212 * Handle the following bytes as if this byte didn't exist.
213 * That's safer in case the subsequent bytes contain
214 * characters that are significant for the caller (e.g. '>' in
215 * html).
216 */
217 remaining--;
218 cp++;
219 }
220 else
221 {
222 for (int i = 0; i < charlen; i++)
223 {
225 remaining--;
226 cp++;
227 }
228 }
229 }
230
232 }
233
234 return id_return->data;
235}
const uint8 ScanKeywordCategories[SCANKEYWORDS_NUM_KEYWORDS]
Definition keywords.c:29
PGDLLIMPORT const ScanKeywordList ScanKeywords
#define UNRESERVED_KEYWORD
Definition keywords.h:20
int ScanKeywordLookup(const char *str, const ScanKeywordList *keywords)
Definition kwlookup.c:38
PQExpBuffer(* getLocalPQExpBuffer)(void)
int quote_all_identifiers
int pg_encoding_mblen(int encoding, const char *mbstr)
Definition wchar.c:1935

References appendPQExpBufferChar(), appendPQExpBufferStr(), encoding, enlargePQExpBuffer(), fb(), getLocalPQExpBuffer, i, IS_HIGHBIT_SET, pg_encoding_mblen(), pg_encoding_set_invalid(), pg_encoding_verifymbchar(), quote_all_identifiers, remaining, ScanKeywordCategories, ScanKeywordLookup(), ScanKeywords, and UNRESERVED_KEYWORD.

Referenced by appendPsqlMetaConnect(), fmtId(), fmtQualifiedIdEnc(), gen_reindex_command(), and main().

◆ fmtQualifiedId()

const char * fmtQualifiedId ( const char * schema,
const char * id 
)

Definition at line 296 of file string_utils.c.

/*
 * fmtQualifiedId: convenience wrapper around fmtQualifiedIdEnc() that
 * supplies the encoding returned by getFmtEncoding() and passes the result
 * through unchanged.
 */
297{
298 return fmtQualifiedIdEnc(schema, id, getFmtEncoding());
299}
const char * fmtQualifiedIdEnc(const char *schema, const char *id, int encoding)

References fmtQualifiedIdEnc(), and getFmtEncoding().

Referenced by _disableTriggersIfNecessary(), _enableTriggersIfNecessary(), _printTableAccessMethodNoStorage(), is_load_via_partition_root(), lockTableForWorker(), and restore_toc_entry().

◆ fmtQualifiedIdEnc()

const char * fmtQualifiedIdEnc ( const char * schema,
const char * id,
int  encoding 
)

Definition at line 263 of file string_utils.c.

264{
267
268 /* Some callers might fail to provide a schema name */
269 if (schema && *schema)
270 {
272 }
274
276
279
280 return id_return->data;
281}

References appendPQExpBuffer(), appendPQExpBufferStr(), createPQExpBuffer(), destroyPQExpBuffer(), encoding, fb(), fmtIdEnc(), and getLocalPQExpBuffer.

Referenced by appendQualifiedRelation(), fmtQualifiedId(), get_parallel_tabidx_list(), get_parallel_tables_list(), and retrieve_objects().

◆ formatPGVersionNumber()

char * formatPGVersionNumber ( int  version_number,
bool  include_minor,
char * buf,
size_t  buflen 
)

Definition at line 313 of file string_utils.c.

/*
 * formatPGVersionNumber: render the integer "version_number" as text into
 * "buf" (capacity "buflen", written with snprintf) and return "buf".
 *
 * Values >= 100000 use the two-part layout: major = version_number / 10000,
 * minor = version_number % 10000, so 100003 yields "10.3", or "10" when
 * include_minor is false.
 *
 * Smaller values use the three-part layout: version_number / 10000, then
 * (version_number / 100) % 100, then version_number % 100, so 90605 yields
 * "9.6.5", or "9.6" when include_minor is false.
 *
 * snprintf's return value is not checked, so truncation is not reported.
 */
315{
316 if (version_number >= 100000)
317 {
318 /* New two-part style */
319 if (include_minor)
320 snprintf(buf, buflen, "%d.%d", version_number / 10000,
321 version_number % 10000);
322 else
323 snprintf(buf, buflen, "%d", version_number / 10000);
324 }
325 else
326 {
327 /* Old three-part style */
328 if (include_minor)
329 snprintf(buf, buflen, "%d.%d.%d", version_number / 10000,
330 (version_number / 100) % 100,
331 version_number % 100);
332 else
/* Here the first two components together are the output without the minor part. */
333 snprintf(buf, buflen, "%d.%d", version_number / 10000,
334 (version_number / 100) % 100);
335 }
336 return buf;
337}
#define snprintf
Definition port.h:261

References buf, fb(), and snprintf.

Referenced by connection_warnings(), describeAccessMethods(), describeFunctions(), describePublications(), describeSubscriptions(), listEventTriggers(), listExtendedStats(), listPartitionedTables(), listPublications(), printVersion(), and SyncVariables().

◆ getFmtEncoding()

static int getFmtEncoding ( void  )
static

Definition at line 78 of file string_utils.c.

/*
 * getFmtEncoding: return fmtIdEncoding when it holds anything other than
 * -1; otherwise trip the Assert below and, where Assert is compiled out,
 * return PG_UTF8.
 *
 * NOTE(review): -1 evidently means "never set"; presumably setFmtEncoding()
 * is what assigns fmtIdEncoding -- its body is not visible here, confirm.
 */
79{
80 if (fmtIdEncoding != -1)
81 return fmtIdEncoding;
82
83 /*
84 * In assertion builds it seems best to fail hard if the encoding was not
85 * set, to make it easier to find places with missing calls. But in
86 * production builds that seems like a bad idea, thus we instead just
87 * default to UTF-8.
88 */
/* Only reached when fmtIdEncoding == -1, so this condition is always false here. */
89 Assert(fmtIdEncoding != -1);
90
91 return PG_UTF8;
92}
#define Assert(condition)
Definition c.h:999
#define PG_UTF8
Definition mbprint.c:43

References Assert, fb(), and PG_UTF8.

Referenced by fmtId(), and fmtQualifiedId().

◆ parsePGArray()

bool parsePGArray ( const char * atext,
char ***  itemarray,
int * nitems 
)

Definition at line 817 of file string_utils.c.

/*
 * parsePGArray: split array text of the form "{item,item,...}" into
 * NUL-terminated strings.
 *
 * Outputs: *itemarray receives a malloc'd block that holds the item
 * pointers followed by the string data; *nitems receives the item count.
 * Both are reset (NULL / 0) before any validation.
 *
 * Returns true on success.  Returns false for input that is not wrapped in
 * braces, for allocation failure, for a premature end of string, or for
 * text following the closing brace.
 *
 * Ownership: once the allocation has succeeded, *itemarray points at the
 * block even on the later failure returns, and this function never frees
 * it, so the caller has to free(*itemarray) whether or not the call
 * succeeded.  *nitems is only updated on success.
 */
818{
819 int inputlen;
820 char **items;
821 char *strings;
822 int curitem;
823
824 /*
825 * We expect input in the form of "{item,item,item}" where any item is
826 * either raw data, or surrounded by double quotes (in which case embedded
827 * characters including backslashes and quotes are backslashed).
828 *
829 * We build the result as an array of pointers followed by the actual
830 * string data, all in one malloc block for convenience of deallocation.
831 * The worst-case storage need is not more than one pointer and one
832 * character for each input character (consider "{,,,,,,,,,,}").
833 */
834 *itemarray = NULL;
835 *nitems = 0;
/*
 * NOTE(review): listing line 836 is missing from this extract.  inputlen is
 * not assigned anywhere in the visible text; presumably that line sets it
 * to the length of atext -- confirm against the real source.
 */
837 if (inputlen < 2 || atext[0] != '{' || atext[inputlen - 1] != '}')
838 return false; /* bad input */
839 items = (char **) malloc(inputlen * (sizeof(char *) + sizeof(char)));
840 if (items == NULL)
841 return false; /* out of memory */
842 *itemarray = items;
/* String storage starts right after the inputlen pointer slots. */
843 strings = (char *) (items + inputlen);
844
845 atext++; /* advance over initial '{' */
846 curitem = 0;
847 while (*atext != '}')
848 {
849 if (*atext == '\0')
850 return false; /* premature end of string */
851 items[curitem] = strings;
/* Collect one item: unquoted runs and quoted runs are concatenated. */
852 while (*atext != '}' && *atext != ',')
853 {
854 if (*atext == '\0')
855 return false; /* premature end of string */
856 if (*atext != '"')
857 *strings++ = *atext++; /* copy unquoted data */
858 else
859 {
860 /* process quoted substring */
861 atext++;
862 while (*atext != '"')
863 {
864 if (*atext == '\0')
865 return false; /* premature end of string */
/* A backslash is dropped and the character after it is copied literally. */
866 if (*atext == '\\')
867 {
868 atext++;
869 if (*atext == '\0')
870 return false; /* premature end of string */
871 }
872 *strings++ = *atext++; /* copy quoted data */
873 }
/* Step over the closing double quote. */
874 atext++;
875 }
876 }
877 *strings++ = '\0';
878 if (*atext == ',')
879 atext++;
880 curitem++;
881 }
/* atext now points at a '}'; it must be the last character of the input. */
882 if (atext[1] != '\0')
883 return false; /* bogus syntax (embedded '}') */
884 *nitems = curitem;
885 return true;
886}
#define nitems(x)
Definition indent.h:31
#define malloc(a)
static ItemArray items

References fb(), items, malloc, and nitems.

Referenced by appendReloptionsArray(), buildACLCommands(), dumpFunc(), dumpIndex(), dumpSearchPath(), dumpSubscription(), getIndexes(), getPublicationTables(), and processExtensionTables().

◆ patternToSQLRegex()

void patternToSQLRegex ( int  encoding,
PQExpBuffer  dbnamebuf,
PQExpBuffer  schemabuf,
PQExpBuffer  namebuf,
const char * pattern,
bool  force_escape,
bool  want_literal_dbname,
int *dotcnt
)

Definition at line 1223 of file string_utils.c.

/*
 * patternToSQLRegex (listing): walks 'pattern' one character at a time,
 * tracking whether the scan is inside double quotes ('inquotes') and
 * counting unquoted '.' separators in *dotcnt.
 *
 * NOTE(review): the embedded source line numbers skip (1227-1230, 1240,
 * 1255, 1258, ...), so several statements are not visible in this listing,
 * including the declarations of buf/curbuf/maxbuf and the calls that append
 * to the output buffers.  Comments below describe only what is visible.
 */
1226{
1231 int i;
1232 bool inquotes;
1233 bool left;
1234 const char *cp;
1235
1236 Assert(pattern != NULL);
1237 Assert(namebuf != NULL);
1238
1239 /* callers should never expect "dbname.relname" format */
1241 Assert(dotcnt != NULL);
1242
1243 *dotcnt = 0;
1244 inquotes = false;
1245 cp = pattern;
1246
/*
 * maxbuf marks the last buf[] slot that may be used: index 2 when a dbname
 * buffer was supplied, index 1 when only a schema buffer was supplied,
 * otherwise index 0.
 */
1247 if (dbnamebuf != NULL)
1248 maxbuf = &buf[2];
1249 else if (schemabuf != NULL)
1250 maxbuf = &buf[1];
1251 else
1252 maxbuf = &buf[0];
1253
1254 curbuf = &buf[0];
/* NOTE(review): the condition guarding this block (line 1255) is elided. */
1256 {
1257 left = true;
1259 }
1260 else
1261 left = false;
1264 while (*cp)
1265 {
1266 char ch = *cp;
1267
1268 if (ch == '"')
1269 {
1270 if (inquotes && cp[1] == '"')
1271 {
1272 /* emit one quote, stay in inquotes mode */
1274 if (left)
1276 cp++; /* extra advance: together with the cp++ below this skips both quotes */
1277 }
1278 else
1279 inquotes = !inquotes;
1280 cp++;
1281 }
/* cast to unsigned char so a negative char value is never passed to isupper() */
1282 else if (!inquotes && isupper((unsigned char) ch))
1283 {
1285 pg_tolower((unsigned char) ch));
1286 if (left)
1288 pg_tolower((unsigned char) ch));
1289 cp++;
1290 }
1291 else if (!inquotes && ch == '*')
1292 {
1294 if (left)
1296 cp++;
1297 }
1298 else if (!inquotes && ch == '?')
1299 {
1301 if (left)
1303 cp++;
1304 }
1305 else if (!inquotes && ch == '.')
1306 {
1307 left = false;
1308 if (dotcnt) /* always true here: dotcnt was already dereferenced above */
1309 (*dotcnt)++;
1310 if (curbuf < maxbuf) /* still room to move on to the next buffer slot */
1311 {
1313 curbuf++;
1316 cp++;
1317 }
1318 else
/* NOTE(review): the body of this else (line 1319) is elided from the listing. */
1320 }
1321 else if (ch == '$')
1322 {
1323 /*
1324 * Dollar is always quoted, whether inside quotes or not. The
1325 * reason is that it's allowed in SQL identifiers, so there's a
1326 * significant use-case for treating it literally, while because
1327 * we anchor the pattern automatically there is no use-case for
1328 * having it possess its regexp meaning.
1329 */
1331 if (left)
1333 cp++;
1334 }
1335 else
1336 {
1337 /*
1338 * Ordinary data character, transfer to pattern
1339 *
1340 * Inside double quotes, or at all times if force_escape is true,
1341 * quote regexp special characters with a backslash to avoid
1342 * regexp errors. Outside quotes, however, let them pass through
1343 * as-is; this lets knowledgeable users build regexp expressions
1344 * that are more powerful than shell-style patterns.
1345 *
1346 * As an exception to that, though, always quote "[]", as that's
1347 * much more likely to be an attempt to write an array type name
1348 * than it is to be the start of a regexp bracket expression.
1349 */
1350 if ((inquotes || force_escape) &&
1351 strchr("|*+?()[]{}.^$\\", ch))
1353 else if (ch == '[' && cp[1] == ']')
/*
 * NOTE(review): the assignment of 'i' (line 1355) is elided; presumably it
 * is the byte length of the current character, since the page lists
 * PQmblenBounded() among this function's references -- confirm.
 */
1356 while (i--)
1357 {
1358 if (left)
1361 }
1362 }
1363 }
1365
/*
 * Finalization: curbuf is stepped backwards once per output buffer.  The
 * statements that move data into namebuf/schemabuf/dbnamebuf are elided
 * from this listing.
 */
1366 if (namebuf) /* namebuf was asserted non-NULL on entry */
1367 {
1370 curbuf--;
1371 }
1372
1373 if (schemabuf && curbuf >= buf)
1374 {
1377 curbuf--;
1378 }
1379
1380 if (dbnamebuf && curbuf >= buf)
1381 {
1384 else
1387 }
1388
1391}
int PQmblenBounded(const char *s, int encoding)
Definition fe-misc.c:1266
unsigned char pg_tolower(unsigned char ch)

References appendPQExpBufferChar(), appendPQExpBufferStr(), Assert, buf, encoding, fb(), i, initPQExpBuffer(), pg_tolower(), PQmblenBounded(), and termPQExpBuffer().

Referenced by append_database_pattern(), append_relation_pattern_helper(), append_schema_pattern(), and processSQLNamePattern().

◆ processSQLNamePattern()

bool processSQLNamePattern ( PGconn *conn,
PQExpBuffer  buf,
const char *pattern,
bool  have_where,
bool  force_escape,
const char *schemavar,
const char *namevar,
const char *altnamevar,
const char *visibilityrule,
PQExpBuffer  dbnamebuf,
int *dotcnt
)

Definition at line 1051 of file string_utils.c.

/*
 * processSQLNamePattern (listing): appends WHERE/AND conditions to 'buf'
 * that restrict namevar/altnamevar/schemavar according to 'pattern', and
 * returns added_clause, which is true only if WHEREAND() was invoked.
 *
 * NOTE(review): the embedded source line numbers skip (1057-1058, 1075,
 * 1080-1081, 1091, ...), so the declarations of schemabuf/namebuf, the head
 * of the patternToSQLRegex() call and the calls that append the pattern
 * literals are not visible in this listing.
 */
1056{
1059 bool added_clause = false;
1060 int dcnt;
1061
/*
 * WHEREAND() emits " AND " if a WHERE clause already exists, else "WHERE ",
 * then records that a WHERE now exists and that a clause was added.
 */
1062#define WHEREAND() \
1063 (appendPQExpBufferStr(buf, have_where ? " AND " : "WHERE "), \
1064 have_where = true, added_clause = true)
1065
/* let callers pass dotcnt == NULL: point it at a local so writes below are safe */
1066 if (dotcnt == NULL)
1067 dotcnt = &dcnt;
1068 *dotcnt = 0;
1069 if (pattern == NULL)
1070 {
1071 /* Default: select all visible objects */
1072 if (visibilityrule)
1073 {
1074 WHEREAND();
1076 }
1077 return added_clause;
1078 }
1079
1082
1083 /*
1084 * Convert shell-style 'pattern' into the regular expression(s) we want to
1085 * execute. Quoting/escaping into SQL literal format will be done below
1086 * using appendStringLiteralConn().
1087 *
1088 * If the caller provided a schemavar, we want to split the pattern on
1089 * ".", otherwise not.
1090 */
1092 (schemavar ? dbnamebuf : NULL),
1093 (schemavar ? &schemabuf : NULL),
1094 &namebuf,
1095 pattern, force_escape, true, dotcnt);
1096
1097 /*
1098 * Now decide what we need to emit. We may run under a hostile
1099 * search_path, so qualify EVERY name. Note there will be a leading "^("
1100 * in the patterns in any case.
1101 *
1102 * We want the regex matches to use the database's default collation where
1103 * collation-sensitive behavior is required (for example, which characters
1104 * match '\w'). That happened by default before PG v12, but if the server
1105 * is >= v12 then we need to force it through explicit COLLATE clauses,
1106 * otherwise the "C" collation attached to "name" catalog columns wins.
1107 */
/* len > 2: more than the leading "^(" mentioned above, i.e. a real pattern */
1108 if (namevar && namebuf.len > 2)
1109 {
1110 /* We have a name pattern, so constrain the namevar(s) */
1111
1112 /* Optimize away a "*" pattern */
1113 if (strcmp(namebuf.data, "^(.*)$") != 0)
1114 {
1115 WHEREAND();
1116 if (altnamevar)
1117 {
1119 "(%s OPERATOR(pg_catalog.~) ", namevar);
1121 if (PQserverVersion(conn) >= 120000)
1122 appendPQExpBufferStr(buf, " COLLATE pg_catalog.default");
1124 "\n OR %s OPERATOR(pg_catalog.~) ",
1125 altnamevar);
1127 if (PQserverVersion(conn) >= 120000)
1128 appendPQExpBufferStr(buf, " COLLATE pg_catalog.default");
1129 appendPQExpBufferStr(buf, ")\n");
1130 }
1131 else
1132 {
1133 appendPQExpBuffer(buf, "%s OPERATOR(pg_catalog.~) ", namevar);
1135 if (PQserverVersion(conn) >= 120000)
1136 appendPQExpBufferStr(buf, " COLLATE pg_catalog.default");
1138 }
1139 }
1140 }
1141
1142 if (schemavar && schemabuf.len > 2)
1143 {
1144 /* We have a schema pattern, so constrain the schemavar */
1145
1146 /* Optimize away a "*" pattern */
/* the "&& schemavar" test is redundant: the enclosing if already requires it */
1147 if (strcmp(schemabuf.data, "^(.*)$") != 0 && schemavar)
1148 {
1149 WHEREAND();
1150 appendPQExpBuffer(buf, "%s OPERATOR(pg_catalog.~) ", schemavar);
1152 if (PQserverVersion(conn) >= 120000)
1153 appendPQExpBufferStr(buf, " COLLATE pg_catalog.default");
1155 }
1156 }
1157 else
1158 {
1159 /* No schema pattern given, so select only visible objects */
1160 if (visibilityrule)
1161 {
1162 WHEREAND();
1164 }
1165 }
1166
1169
1170 return added_clause;
1171#undef WHEREAND
1172}
void appendStringLiteralConn(PQExpBuffer buf, const char *str, PGconn *conn)
void patternToSQLRegex(int encoding, PQExpBuffer dbnamebuf, PQExpBuffer schemabuf, PQExpBuffer namebuf, const char *pattern, bool force_escape, bool want_literal_dbname, int *dotcnt)
#define WHEREAND()

References appendPQExpBuffer(), appendPQExpBufferChar(), appendPQExpBufferStr(), appendStringLiteralConn(), buf, conn, fb(), initPQExpBuffer(), patternToSQLRegex(), PQclientEncoding(), PQserverVersion(), termPQExpBuffer(), and WHEREAND.

Referenced by describeConfigurationParameters(), expand_dbname_patterns(), expand_extension_name_patterns(), expand_foreign_server_name_patterns(), expand_schema_name_patterns(), expand_table_name_patterns(), and validateSQLNamePattern().

◆ setFmtEncoding()

void setFmtEncoding ( int  encoding)

Variable Documentation

◆ getLocalPQExpBuffer

PQExpBuffer(* getLocalPQExpBuffer) (void) ( void  )
default

Definition at line 28 of file string_utils.c.

/*
 * Returns a function-local static PQExpBuffer that is reused across calls.
 *
 * NOTE(review): this listing shows only the function body (presumably
 * defaultGetLocalPQExpBuffer()), and listing lines 49 and 54 -- the
 * statements inside the two branches -- are elided.
 */
43{
44 static PQExpBuffer id_return = NULL;
45
46 if (id_return) /* non-NULL: a buffer already exists from an earlier call */
47 {
48 /* same buffer, just wipe contents */
50 }
51 else
52 {
53 /* new buffer */
55 }
56
57 return id_return;
58}
void resetPQExpBuffer(PQExpBuffer str)

Referenced by fmtIdEnc(), fmtQualifiedIdEnc(), and ParallelBackupStart().

◆ quote_all_identifiers

int quote_all_identifiers = 0

Definition at line 27 of file string_utils.c.

Referenced by fmtIdEnc().