Set psql client encoding from locale by default

Add a new libpq connection option client_encoding (which includes the
existing PGCLIENTENCODING environment variable), which besides an
encoding name accepts a special value "auto" that tries to determine
the encoding from the locale in the client's environment, using the
mechanisms that have been in use in initdb.

psql sets this new connection option to "auto" when running from a
terminal and not overridden by setting PGCLIENTENCODING.

original code by Heikki Linnakangas, with subsequent contributions by
Jaime Casanova, Peter Eisentraut, Stephen Frost, Ibrar Ahmed
This commit is contained in:
Peter Eisentraut 2011-02-19 08:54:58 +02:00
parent 327e025071
commit 02e14562a8
10 changed files with 136 additions and 24 deletions

View File

@ -259,6 +259,21 @@ PGconn *PQconnectdbParams(const char **keywords, const char **values, int expand
</listitem> </listitem>
</varlistentry> </varlistentry>
<varlistentry id="libpq-connect-client-encoding" xreflabel="client_encoding">
<term><literal>client_encoding</literal></term>
<listitem>
<para>
This sets the <varname>client_encoding</varname>
configuration parameter for this connection. In addition to
the values accepted by the corresponding server option, you
can use <literal>auto</literal> to determine the right
encoding from the current locale in the client
(<envar>LC_CTYPE</envar> environment variable on Unix
systems).
</para>
</listitem>
</varlistentry>
<varlistentry id="libpq-connect-options" xreflabel="options"> <varlistentry id="libpq-connect-options" xreflabel="options">
<term><literal>options</literal></term> <term><literal>options</literal></term>
<listitem> <listitem>
@ -6345,6 +6360,16 @@ myEventProc(PGEventId evtId, void *evtInfo, void *passThrough)
linkend="libpq-connect-connect-timeout"> connection parameter. linkend="libpq-connect-connect-timeout"> connection parameter.
</para> </para>
</listitem> </listitem>
<listitem>
<para>
<indexterm>
<primary><envar>PGCLIENTENCODING</envar></primary>
</indexterm>
<envar>PGCLIENTENCODING</envar> behaves the same as the <xref
linkend="libpq-connect-client-encoding"> connection parameter.
</para>
</listitem>
</itemizedlist> </itemizedlist>
</para> </para>
@ -6378,17 +6403,6 @@ myEventProc(PGEventId evtId, void *evtInfo, void *passThrough)
</para> </para>
</listitem> </listitem>
<listitem>
<para>
<indexterm>
<primary><envar>PGCLIENTENCODING</envar></primary>
</indexterm>
<envar>PGCLIENTENCODING</envar> sets the default client character
set encoding. (Equivalent to <literal>SET client_encoding TO
...</literal>.)
</para>
</listitem>
<listitem> <listitem>
<para> <para>
<indexterm> <indexterm>

View File

@ -593,6 +593,17 @@ $ <userinput>psql "service=myservice sslmode=require"</userinput>
privileges, server is not running on the targeted host, etc.), privileges, server is not running on the targeted host, etc.),
<application>psql</application> will return an error and terminate. <application>psql</application> will return an error and terminate.
</para> </para>
<para>
If at least one of standard input or standard output are a
terminal, then <application>psql</application> sets the client
encoding to <quote>auto</quote>, which will detect the
appropriate client encoding from the locale settings
(<envar>LC_CTYPE</envar> environment variable on Unix systems).
If this doesn't work out as expected, the client encoding can be
overridden using the environment
variable <envar>PGCLIENTENCODING</envar>.
</para>
</refsect2> </refsect2>
<refsect2 id="R2-APP-PSQL-4"> <refsect2 id="R2-APP-PSQL-4">

View File

@ -1487,7 +1487,7 @@ do_connect(char *dbname, char *user, char *host, char *port)
while (true) while (true)
{ {
#define PARAMS_ARRAY_SIZE 7 #define PARAMS_ARRAY_SIZE 8
const char **keywords = pg_malloc(PARAMS_ARRAY_SIZE * sizeof(*keywords)); const char **keywords = pg_malloc(PARAMS_ARRAY_SIZE * sizeof(*keywords));
const char **values = pg_malloc(PARAMS_ARRAY_SIZE * sizeof(*values)); const char **values = pg_malloc(PARAMS_ARRAY_SIZE * sizeof(*values));
@ -1503,8 +1503,10 @@ do_connect(char *dbname, char *user, char *host, char *port)
values[4] = dbname; values[4] = dbname;
keywords[5] = "fallback_application_name"; keywords[5] = "fallback_application_name";
values[5] = pset.progname; values[5] = pset.progname;
keywords[6] = NULL; keywords[6] = "client_encoding";
values[6] = NULL; values[6] = (pset.notty || getenv("PGCLIENTENCODING")) ? NULL : "auto";
keywords[7] = NULL;
values[7] = NULL;
n_conn = PQconnectdbParams(keywords, values, true); n_conn = PQconnectdbParams(keywords, values, true);

View File

@ -171,7 +171,7 @@ main(int argc, char *argv[])
/* loop until we have a password if requested by backend */ /* loop until we have a password if requested by backend */
do do
{ {
#define PARAMS_ARRAY_SIZE 7 #define PARAMS_ARRAY_SIZE 8
const char **keywords = pg_malloc(PARAMS_ARRAY_SIZE * sizeof(*keywords)); const char **keywords = pg_malloc(PARAMS_ARRAY_SIZE * sizeof(*keywords));
const char **values = pg_malloc(PARAMS_ARRAY_SIZE * sizeof(*values)); const char **values = pg_malloc(PARAMS_ARRAY_SIZE * sizeof(*values));
@ -189,8 +189,10 @@ main(int argc, char *argv[])
"postgres" : options.dbname; "postgres" : options.dbname;
keywords[5] = "fallback_application_name"; keywords[5] = "fallback_application_name";
values[5] = pset.progname; values[5] = pset.progname;
keywords[6] = NULL; keywords[6] = "client_encoding";
values[6] = NULL; values[6] = (pset.notty || getenv("PGCLIENTENCODING")) ? NULL : "auto";
keywords[7] = NULL;
values[7] = NULL;
new_pass = false; new_pass = false;
pset.db = PQconnectdbParams(keywords, values, true); pset.db = PQconnectdbParams(keywords, values, true);

View File

@ -1,4 +1,5 @@
/exports.list /exports.list
/chklocale.c
/crypt.c /crypt.c
/getaddrinfo.c /getaddrinfo.c
/inet_aton.c /inet_aton.c

View File

@ -35,7 +35,7 @@ OBJS= fe-auth.o fe-connect.o fe-exec.o fe-misc.o fe-print.o fe-lobj.o \
fe-protocol2.o fe-protocol3.o pqexpbuffer.o pqsignal.o fe-secure.o \ fe-protocol2.o fe-protocol3.o pqexpbuffer.o pqsignal.o fe-secure.o \
libpq-events.o libpq-events.o
# libpgport C files we always use # libpgport C files we always use
OBJS += inet_net_ntop.o noblock.o pgstrcasecmp.o thread.o OBJS += chklocale.o inet_net_ntop.o noblock.o pgstrcasecmp.o thread.o
# libpgport C files that are needed if identified by configure # libpgport C files that are needed if identified by configure
OBJS += $(filter crypt.o getaddrinfo.o inet_aton.o open.o snprintf.o strerror.o strlcpy.o win32error.o, $(LIBOBJS)) OBJS += $(filter crypt.o getaddrinfo.o inet_aton.o open.o snprintf.o strerror.o strlcpy.o win32error.o, $(LIBOBJS))
# backend/libpq # backend/libpq
@ -88,7 +88,7 @@ backend_src = $(top_srcdir)/src/backend
# For some libpgport modules, this only happens if configure decides # For some libpgport modules, this only happens if configure decides
# the module is needed (see filter hack in OBJS, above). # the module is needed (see filter hack in OBJS, above).
crypt.c getaddrinfo.c inet_aton.c inet_net_ntop.c noblock.c open.c pgsleep.c pgstrcasecmp.c snprintf.c strerror.c strlcpy.c thread.c win32error.c: % : $(top_srcdir)/src/port/% chklocale.c crypt.c getaddrinfo.c inet_aton.c inet_net_ntop.c noblock.c open.c pgsleep.c pgstrcasecmp.c snprintf.c strerror.c strlcpy.c thread.c win32error.c: % : $(top_srcdir)/src/port/%
rm -f $@ && $(LN_S) $< . rm -f $@ && $(LN_S) $< .
ip.c md5.c: % : $(backend_src)/libpq/% ip.c md5.c: % : $(backend_src)/libpq/%
@ -135,7 +135,7 @@ clean distclean: clean-lib
# Might be left over from a Win32 client-only build # Might be left over from a Win32 client-only build
rm -f pg_config_paths.h rm -f pg_config_paths.h
rm -f inet_net_ntop.c noblock.c pgstrcasecmp.c thread.c rm -f inet_net_ntop.c noblock.c pgstrcasecmp.c thread.c
rm -f crypt.c getaddrinfo.c inet_aton.c open.c snprintf.c strerror.c strlcpy.c win32error.c rm -f chklocale.c crypt.c getaddrinfo.c inet_aton.c open.c snprintf.c strerror.c strlcpy.c win32error.c
rm -f pgsleep.c rm -f pgsleep.c
rm -f md5.c ip.c rm -f md5.c ip.c
rm -f encnames.c wchar.c rm -f encnames.c wchar.c

View File

@ -175,6 +175,9 @@ static const PQconninfoOption PQconninfoOptions[] = {
{"port", "PGPORT", DEF_PGPORT_STR, NULL, {"port", "PGPORT", DEF_PGPORT_STR, NULL,
"Database-Port", "", 6}, "Database-Port", "", 6},
{"client_encoding", "PGCLIENTENCODING", NULL, NULL,
"Client-Encoding", "", 10},
/* /*
* "tty" is no longer used either, but keep it present for backwards * "tty" is no longer used either, but keep it present for backwards
* compatibility. * compatibility.
@ -270,9 +273,6 @@ static const PQEnvironmentOption EnvironmentOptions[] =
{ {
"PGTZ", "timezone" "PGTZ", "timezone"
}, },
{
"PGCLIENTENCODING", "client_encoding"
},
/* internal performance-related settings */ /* internal performance-related settings */
{ {
"PGGEQO", "geqo" "PGGEQO", "geqo"
@ -612,6 +612,8 @@ fillPGconn(PGconn *conn, PQconninfoOption *connOptions)
conn->pgpass = tmp ? strdup(tmp) : NULL; conn->pgpass = tmp ? strdup(tmp) : NULL;
tmp = conninfo_getval(connOptions, "connect_timeout"); tmp = conninfo_getval(connOptions, "connect_timeout");
conn->connect_timeout = tmp ? strdup(tmp) : NULL; conn->connect_timeout = tmp ? strdup(tmp) : NULL;
tmp = conninfo_getval(connOptions, "client_encoding");
conn->client_encoding_initial = tmp ? strdup(tmp) : NULL;
tmp = conninfo_getval(connOptions, "keepalives"); tmp = conninfo_getval(connOptions, "keepalives");
conn->keepalives = tmp ? strdup(tmp) : NULL; conn->keepalives = tmp ? strdup(tmp) : NULL;
tmp = conninfo_getval(connOptions, "keepalives_idle"); tmp = conninfo_getval(connOptions, "keepalives_idle");
@ -786,6 +788,16 @@ connectOptions2(PGconn *conn)
else else
conn->sslmode = strdup(DefaultSSLMode); conn->sslmode = strdup(DefaultSSLMode);
/*
* Resolve special "auto" client_encoding from the locale
*/
if (conn->client_encoding_initial &&
strcmp(conn->client_encoding_initial, "auto") == 0)
{
free(conn->client_encoding_initial);
conn->client_encoding_initial = strdup(pg_encoding_to_char(pg_get_encoding_from_locale(NULL, true)));
}
/* /*
* Only if we get this far is it appropriate to try to connect. (We need a * Only if we get this far is it appropriate to try to connect. (We need a
* state flag, rather than just the boolean result of this function, in * state flag, rather than just the boolean result of this function, in
@ -2508,7 +2520,7 @@ keep_going: /* We will come back to here until there is
if (PG_PROTOCOL_MAJOR(conn->pversion) < 3) if (PG_PROTOCOL_MAJOR(conn->pversion) < 3)
{ {
conn->status = CONNECTION_SETENV; conn->status = CONNECTION_SETENV;
conn->setenv_state = SETENV_STATE_OPTION_SEND; conn->setenv_state = SETENV_STATE_CLIENT_ENCODING_SEND;
conn->next_eo = EnvironmentOptions; conn->next_eo = EnvironmentOptions;
return PGRES_POLLING_WRITING; return PGRES_POLLING_WRITING;
} }
@ -4661,6 +4673,10 @@ PQsetClientEncoding(PGconn *conn, const char *encoding)
if (!encoding) if (!encoding)
return -1; return -1;
/* Resolve special "auto" value from the locale */
if (strcmp(encoding, "auto") == 0)
encoding = pg_encoding_to_char(pg_get_encoding_from_locale(NULL, true));
/* check query buffer overflow */ /* check query buffer overflow */
if (sizeof(qbuf) < (sizeof(query) + strlen(encoding))) if (sizeof(qbuf) < (sizeof(query) + strlen(encoding)))
return -1; return -1;

View File

@ -58,6 +58,7 @@ pqSetenvPoll(PGconn *conn)
switch (conn->setenv_state) switch (conn->setenv_state)
{ {
/* These are reading states */ /* These are reading states */
case SETENV_STATE_CLIENT_ENCODING_WAIT:
case SETENV_STATE_OPTION_WAIT: case SETENV_STATE_OPTION_WAIT:
case SETENV_STATE_QUERY1_WAIT: case SETENV_STATE_QUERY1_WAIT:
case SETENV_STATE_QUERY2_WAIT: case SETENV_STATE_QUERY2_WAIT:
@ -74,6 +75,7 @@ pqSetenvPoll(PGconn *conn)
} }
/* These are writing states, so we just proceed. */ /* These are writing states, so we just proceed. */
case SETENV_STATE_CLIENT_ENCODING_SEND:
case SETENV_STATE_OPTION_SEND: case SETENV_STATE_OPTION_SEND:
case SETENV_STATE_QUERY1_SEND: case SETENV_STATE_QUERY1_SEND:
case SETENV_STATE_QUERY2_SEND: case SETENV_STATE_QUERY2_SEND:
@ -98,6 +100,39 @@ pqSetenvPoll(PGconn *conn)
{ {
switch (conn->setenv_state) switch (conn->setenv_state)
{ {
/*
* The _CLIENT_ENCODING_SEND code is slightly different
* from _OPTION_SEND below (e.g., no getenv() call), which
* is why a different state is used.
*/
case SETENV_STATE_CLIENT_ENCODING_SEND:
{
char setQuery[100]; /* note length limit in
* sprintf below */
const char *val = conn->client_encoding_initial;
if (val)
{
if (pg_strcasecmp(val, "default") == 0)
sprintf(setQuery, "SET client_encoding = DEFAULT");
else
sprintf(setQuery, "SET client_encoding = '%.60s'",
val);
#ifdef CONNECTDEBUG
fprintf(stderr,
"Sending client_encoding with %s\n",
setQuery);
#endif
if (!PQsendQuery(conn, setQuery))
goto error_return;
conn->setenv_state = SETENV_STATE_CLIENT_ENCODING_WAIT;
}
else
conn->setenv_state = SETENV_STATE_OPTION_SEND;
break;
}
case SETENV_STATE_OPTION_SEND: case SETENV_STATE_OPTION_SEND:
{ {
/* /*
@ -142,6 +177,31 @@ pqSetenvPoll(PGconn *conn)
break; break;
} }
case SETENV_STATE_CLIENT_ENCODING_WAIT:
{
if (PQisBusy(conn))
return PGRES_POLLING_READING;
res = PQgetResult(conn);
if (res)
{
if (PQresultStatus(res) != PGRES_COMMAND_OK)
{
PQclear(res);
goto error_return;
}
PQclear(res);
/* Keep reading until PQgetResult returns NULL */
}
else
{
/* Query finished, so send the next option */
conn->setenv_state = SETENV_STATE_OPTION_SEND;
}
break;
}
case SETENV_STATE_OPTION_WAIT: case SETENV_STATE_OPTION_WAIT:
{ {
if (PQisBusy(conn)) if (PQisBusy(conn))

View File

@ -1933,6 +1933,9 @@ build_startup_packet(const PGconn *conn, char *packet,
ADD_STARTUP_OPTION("application_name", val); ADD_STARTUP_OPTION("application_name", val);
} }
if (conn->client_encoding_initial && conn->client_encoding_initial[0])
ADD_STARTUP_OPTION("client_encoding", conn->client_encoding_initial);
/* Add any environment-driven GUC settings needed */ /* Add any environment-driven GUC settings needed */
for (next_eo = options; next_eo->envName; next_eo++) for (next_eo = options; next_eo->envName; next_eo++)
{ {

View File

@ -235,6 +235,8 @@ typedef enum
/* (this is used only for 2.0-protocol connections) */ /* (this is used only for 2.0-protocol connections) */
typedef enum typedef enum
{ {
SETENV_STATE_CLIENT_ENCODING_SEND, /* About to send an Environment Option */
SETENV_STATE_CLIENT_ENCODING_WAIT, /* Waiting for above send to complete */
SETENV_STATE_OPTION_SEND, /* About to send an Environment Option */ SETENV_STATE_OPTION_SEND, /* About to send an Environment Option */
SETENV_STATE_OPTION_WAIT, /* Waiting for above send to complete */ SETENV_STATE_OPTION_WAIT, /* Waiting for above send to complete */
SETENV_STATE_QUERY1_SEND, /* About to send a status query */ SETENV_STATE_QUERY1_SEND, /* About to send a status query */
@ -293,6 +295,7 @@ struct pg_conn
char *pgtty; /* tty on which the backend messages is char *pgtty; /* tty on which the backend messages is
* displayed (OBSOLETE, NOT USED) */ * displayed (OBSOLETE, NOT USED) */
char *connect_timeout; /* connection timeout (numeric string) */ char *connect_timeout; /* connection timeout (numeric string) */
char *client_encoding_initial; /* encoding to use */
char *pgoptions; /* options to start the backend with */ char *pgoptions; /* options to start the backend with */
char *appname; /* application name */ char *appname; /* application name */
char *fbappname; /* fallback application name */ char *fbappname; /* fallback application name */