mirror of
https://git.postgresql.org/git/postgresql.git
synced 2024-11-21 03:13:05 +08:00
postgres_fdw: Push down joins to remote servers.
If we've got a relatively straightforward join between two tables, this pushes that join down to the remote server instead of fetching the rows for each table and performing the join locally. Some cases are not handled yet, such as SEMI and ANTI joins. Also, we don't yet attempt to create presorted join paths or parameterized join paths even though these options do get tried for a base relation scan. Nevertheless, this seems likely to be a very significant win in many practical cases. Shigeru Hanada and Ashutosh Bapat, reviewed by Robert Haas, with additional review at various points by Tom Lane, Etsuro Fujita, KaiGai Kohei, and Jeevan Chalke.
This commit is contained in:
parent
7351e18286
commit
e4106b2528
@ -44,10 +44,12 @@
|
||||
#include "catalog/pg_proc.h"
|
||||
#include "catalog/pg_type.h"
|
||||
#include "commands/defrem.h"
|
||||
#include "nodes/makefuncs.h"
|
||||
#include "nodes/nodeFuncs.h"
|
||||
#include "nodes/plannodes.h"
|
||||
#include "optimizer/clauses.h"
|
||||
#include "optimizer/prep.h"
|
||||
#include "optimizer/tlist.h"
|
||||
#include "optimizer/var.h"
|
||||
#include "parser/parsetree.h"
|
||||
#include "utils/builtins.h"
|
||||
@ -96,6 +98,11 @@ typedef struct deparse_expr_cxt
|
||||
List **params_list; /* exprs that will become remote Params */
|
||||
} deparse_expr_cxt;
|
||||
|
||||
#define REL_ALIAS_PREFIX "r"
|
||||
/* Handy macro to add relation name qualification */
|
||||
#define ADD_REL_QUALIFIER(buf, varno) \
|
||||
appendStringInfo((buf), "%s%d.", REL_ALIAS_PREFIX, (varno))
|
||||
|
||||
/*
|
||||
* Functions to determine whether an expression can be evaluated safely on
|
||||
* remote server.
|
||||
@ -114,14 +121,17 @@ static void deparseTargetList(StringInfo buf,
|
||||
Relation rel,
|
||||
bool is_returning,
|
||||
Bitmapset *attrs_used,
|
||||
bool qualify_col,
|
||||
List **retrieved_attrs);
|
||||
static void deparseExplicitTargetList(List *tlist, List **retrieved_attrs,
|
||||
deparse_expr_cxt *context);
|
||||
static void deparseReturningList(StringInfo buf, PlannerInfo *root,
|
||||
Index rtindex, Relation rel,
|
||||
bool trig_after_row,
|
||||
List *returningList,
|
||||
List **retrieved_attrs);
|
||||
static void deparseColumnRef(StringInfo buf, int varno, int varattno,
|
||||
PlannerInfo *root);
|
||||
PlannerInfo *root, bool qualify_col);
|
||||
static void deparseRelation(StringInfo buf, Relation rel);
|
||||
static void deparseExpr(Expr *expr, deparse_expr_cxt *context);
|
||||
static void deparseVar(Var *node, deparse_expr_cxt *context);
|
||||
@ -142,11 +152,13 @@ static void printRemoteParam(int paramindex, Oid paramtype, int32 paramtypmod,
|
||||
deparse_expr_cxt *context);
|
||||
static void printRemotePlaceholder(Oid paramtype, int32 paramtypmod,
|
||||
deparse_expr_cxt *context);
|
||||
static void deparseSelectSql(Bitmapset *attrs_used, List **retrieved_attrs,
|
||||
static void deparseSelectSql(List *tlist, List **retrieved_attrs,
|
||||
deparse_expr_cxt *context);
|
||||
static void deparseLockingClause(deparse_expr_cxt *context);
|
||||
static void appendWhereClause(List *exprs, deparse_expr_cxt *context);
|
||||
static void appendOrderByClause(List *pathkeys, deparse_expr_cxt *context);
|
||||
static void appendConditions(List *exprs, deparse_expr_cxt *context);
|
||||
static void deparseFromExprForRel(StringInfo buf, PlannerInfo *root,
|
||||
RelOptInfo *joinrel, bool use_alias, List **params_list);
|
||||
|
||||
|
||||
/*
|
||||
@ -269,7 +281,7 @@ foreign_expr_walker(Node *node,
|
||||
* Param's collation, ie it's not safe for it to have a
|
||||
* non-default collation.
|
||||
*/
|
||||
if (var->varno == glob_cxt->foreignrel->relid &&
|
||||
if (bms_is_member(var->varno, glob_cxt->foreignrel->relids) &&
|
||||
var->varlevelsup == 0)
|
||||
{
|
||||
/* Var belongs to foreign table */
|
||||
@ -703,43 +715,80 @@ deparse_type_name(Oid type_oid, int32 typemod)
|
||||
return format_type_with_typemod_qualified(type_oid, typemod);
|
||||
}
|
||||
|
||||
/*
|
||||
* Build the targetlist for given relation to be deparsed as SELECT clause.
|
||||
*
|
||||
* The output targetlist contains the columns that need to be fetched from the
|
||||
* foreign server for the given relation.
|
||||
*/
|
||||
List *
|
||||
build_tlist_to_deparse(RelOptInfo *foreignrel)
|
||||
{
|
||||
List *tlist = NIL;
|
||||
PgFdwRelationInfo *fpinfo = (PgFdwRelationInfo *) foreignrel->fdw_private;
|
||||
|
||||
/*
|
||||
* We require columns specified in foreignrel->reltargetlist and those
|
||||
* required for evaluating the local conditions.
|
||||
*/
|
||||
tlist = add_to_flat_tlist(tlist, foreignrel->reltargetlist);
|
||||
tlist = add_to_flat_tlist(tlist,
|
||||
pull_var_clause((Node *) fpinfo->local_conds,
|
||||
PVC_REJECT_AGGREGATES,
|
||||
PVC_RECURSE_PLACEHOLDERS));
|
||||
|
||||
return tlist;
|
||||
}
|
||||
|
||||
/*
|
||||
* Deparse SELECT statement for given relation into buf.
|
||||
*
|
||||
* tlist contains the list of desired columns to be fetched from foreign server.
|
||||
* For a base relation fpinfo->attrs_used is used to construct SELECT clause,
|
||||
* hence the tlist is ignored for a base relation.
|
||||
*
|
||||
* remote_conds is the list of conditions to be deparsed as WHERE clause.
|
||||
*
|
||||
* pathkeys is the list of pathkeys to order the result by.
|
||||
*
|
||||
* List of columns selected is returned in retrieved_attrs.
|
||||
*
|
||||
* If params_list is not NULL, it receives a list of Params and other-relation
|
||||
* Vars used in the clauses; these values must be transmitted to the remote
|
||||
* server as parameter values.
|
||||
*
|
||||
* If params_list is NULL, we're generating the query for EXPLAIN purposes,
|
||||
* so Params and other-relation Vars should be replaced by dummy values.
|
||||
*
|
||||
* pathkeys is the list of pathkeys to order the result by.
|
||||
*
|
||||
* List of columns selected is returned in retrieved_attrs.
|
||||
*/
|
||||
extern void
|
||||
deparseSelectStmtForRel(StringInfo buf, PlannerInfo *root, RelOptInfo *rel,
|
||||
List *remote_conds, List *pathkeys,
|
||||
List *tlist, List *remote_conds, List *pathkeys,
|
||||
List **retrieved_attrs, List **params_list)
|
||||
{
|
||||
PgFdwRelationInfo *fpinfo = (PgFdwRelationInfo *) rel->fdw_private;
|
||||
deparse_expr_cxt context;
|
||||
|
||||
/* Initialize params_list if caller needs one */
|
||||
if (params_list)
|
||||
*params_list = NIL;
|
||||
/* We handle relations for foreign tables and joins between those */
|
||||
Assert(rel->reloptkind == RELOPT_JOINREL ||
|
||||
rel->reloptkind == RELOPT_BASEREL ||
|
||||
rel->reloptkind == RELOPT_OTHER_MEMBER_REL);
|
||||
|
||||
/* Fill portions of context common to join and base relation */
|
||||
context.buf = buf;
|
||||
context.root = root;
|
||||
context.foreignrel = rel;
|
||||
context.params_list = params_list;
|
||||
|
||||
deparseSelectSql(fpinfo->attrs_used, retrieved_attrs, &context);
|
||||
/* Construct SELECT clause and FROM clause */
|
||||
deparseSelectSql(tlist, retrieved_attrs, &context);
|
||||
|
||||
/*
|
||||
* Construct WHERE clause
|
||||
*/
|
||||
if (remote_conds)
|
||||
appendWhereClause(remote_conds, &context);
|
||||
{
|
||||
appendStringInfo(buf, " WHERE ");
|
||||
appendConditions(remote_conds, &context);
|
||||
}
|
||||
|
||||
/* Add ORDER BY clause if we found any useful pathkeys */
|
||||
if (pathkeys)
|
||||
@ -752,41 +801,58 @@ deparseSelectStmtForRel(StringInfo buf, PlannerInfo *root, RelOptInfo *rel,
|
||||
/*
|
||||
* Construct a simple SELECT statement that retrieves desired columns
|
||||
* of the specified foreign table, and append it to "buf". The output
|
||||
* contains just "SELECT ... FROM tablename".
|
||||
* contains just "SELECT ... FROM ....".
|
||||
*
|
||||
* We also create an integer List of the columns being retrieved, which is
|
||||
* returned to *retrieved_attrs.
|
||||
*
|
||||
* tlist is the list of desired columns. Read prologue of
|
||||
* deparseSelectStmtForRel() for details.
|
||||
*/
|
||||
static void
|
||||
deparseSelectSql(Bitmapset *attrs_used, List **retrieved_attrs,
|
||||
deparse_expr_cxt *context)
|
||||
deparseSelectSql(List *tlist, List **retrieved_attrs, deparse_expr_cxt *context)
|
||||
{
|
||||
StringInfo buf = context->buf;
|
||||
RelOptInfo *foreignrel = context->foreignrel;
|
||||
PlannerInfo *root = context->root;
|
||||
RangeTblEntry *rte = planner_rt_fetch(foreignrel->relid, root);
|
||||
Relation rel;
|
||||
|
||||
/*
|
||||
* Core code already has some lock on each rel being planned, so we can
|
||||
* use NoLock here.
|
||||
*/
|
||||
rel = heap_open(rte->relid, NoLock);
|
||||
PgFdwRelationInfo *fpinfo = (PgFdwRelationInfo *) foreignrel->fdw_private;
|
||||
|
||||
/*
|
||||
* Construct SELECT list
|
||||
*/
|
||||
appendStringInfoString(buf, "SELECT ");
|
||||
deparseTargetList(buf, root, foreignrel->relid, rel, false, attrs_used,
|
||||
retrieved_attrs);
|
||||
|
||||
if (foreignrel->reloptkind == RELOPT_JOINREL)
|
||||
{
|
||||
/* For a join relation use the input tlist */
|
||||
deparseExplicitTargetList(tlist, retrieved_attrs, context);
|
||||
}
|
||||
else
|
||||
{
|
||||
/*
|
||||
* For a base relation fpinfo->attrs_used gives the list of columns
|
||||
* required to be fetched from the foreign server.
|
||||
*/
|
||||
RangeTblEntry *rte = planner_rt_fetch(foreignrel->relid, root);
|
||||
|
||||
/*
|
||||
* Core code already has some lock on each rel being planned, so we
|
||||
* can use NoLock here.
|
||||
*/
|
||||
Relation rel = heap_open(rte->relid, NoLock);
|
||||
|
||||
deparseTargetList(buf, root, foreignrel->relid, rel, false,
|
||||
fpinfo->attrs_used, false, retrieved_attrs);
|
||||
heap_close(rel, NoLock);
|
||||
}
|
||||
|
||||
/*
|
||||
* Construct FROM clause
|
||||
*/
|
||||
appendStringInfoString(buf, " FROM ");
|
||||
deparseRelation(buf, rel);
|
||||
|
||||
heap_close(rel, NoLock);
|
||||
deparseFromExprForRel(buf, root, foreignrel,
|
||||
(foreignrel->reloptkind == RELOPT_JOINREL),
|
||||
context->params_list);
|
||||
}
|
||||
|
||||
/*
|
||||
@ -796,6 +862,8 @@ deparseSelectSql(Bitmapset *attrs_used, List **retrieved_attrs,
|
||||
*
|
||||
* The tlist text is appended to buf, and we also create an integer List
|
||||
* of the columns being retrieved, which is returned to *retrieved_attrs.
|
||||
*
|
||||
* If qualify_col is true, add relation alias before the column name.
|
||||
*/
|
||||
static void
|
||||
deparseTargetList(StringInfo buf,
|
||||
@ -804,6 +872,7 @@ deparseTargetList(StringInfo buf,
|
||||
Relation rel,
|
||||
bool is_returning,
|
||||
Bitmapset *attrs_used,
|
||||
bool qualify_col,
|
||||
List **retrieved_attrs)
|
||||
{
|
||||
TupleDesc tupdesc = RelationGetDescr(rel);
|
||||
@ -836,7 +905,7 @@ deparseTargetList(StringInfo buf,
|
||||
appendStringInfoString(buf, " RETURNING ");
|
||||
first = false;
|
||||
|
||||
deparseColumnRef(buf, rtindex, i, root);
|
||||
deparseColumnRef(buf, rtindex, i, root, qualify_col);
|
||||
|
||||
*retrieved_attrs = lappend_int(*retrieved_attrs, i);
|
||||
}
|
||||
@ -855,6 +924,8 @@ deparseTargetList(StringInfo buf,
|
||||
appendStringInfoString(buf, " RETURNING ");
|
||||
first = false;
|
||||
|
||||
if (qualify_col)
|
||||
ADD_REL_QUALIFIER(buf, rtindex);
|
||||
appendStringInfoString(buf, "ctid");
|
||||
|
||||
*retrieved_attrs = lappend_int(*retrieved_attrs,
|
||||
@ -876,64 +947,81 @@ deparseLockingClause(deparse_expr_cxt *context)
|
||||
StringInfo buf = context->buf;
|
||||
PlannerInfo *root = context->root;
|
||||
RelOptInfo *rel = context->foreignrel;
|
||||
int relid = -1;
|
||||
|
||||
/*
|
||||
* Add FOR UPDATE/SHARE if appropriate. We apply locking during the
|
||||
* initial row fetch, rather than later on as is done for local tables.
|
||||
* The extra roundtrips involved in trying to duplicate the local
|
||||
* semantics exactly don't seem worthwhile (see also comments for
|
||||
* RowMarkType).
|
||||
*
|
||||
* Note: because we actually run the query as a cursor, this assumes that
|
||||
* DECLARE CURSOR ... FOR UPDATE is supported, which it isn't before 8.3.
|
||||
*/
|
||||
if (rel->relid == root->parse->resultRelation &&
|
||||
(root->parse->commandType == CMD_UPDATE ||
|
||||
root->parse->commandType == CMD_DELETE))
|
||||
while ((relid = bms_next_member(rel->relids, relid)) >= 0)
|
||||
{
|
||||
/* Relation is UPDATE/DELETE target, so use FOR UPDATE */
|
||||
appendStringInfoString(buf, " FOR UPDATE");
|
||||
}
|
||||
else
|
||||
{
|
||||
PlanRowMark *rc = get_plan_rowmark(root->rowMarks, rel->relid);
|
||||
|
||||
if (rc)
|
||||
/*
|
||||
* Add FOR UPDATE/SHARE if appropriate. We apply locking during the
|
||||
* initial row fetch, rather than later on as is done for local
|
||||
* tables. The extra roundtrips involved in trying to duplicate the
|
||||
* local semantics exactly don't seem worthwhile (see also comments
|
||||
* for RowMarkType).
|
||||
*
|
||||
* Note: because we actually run the query as a cursor, this assumes
|
||||
* that DECLARE CURSOR ... FOR UPDATE is supported, which it isn't
|
||||
* before 8.3.
|
||||
*/
|
||||
if (relid == root->parse->resultRelation &&
|
||||
(root->parse->commandType == CMD_UPDATE ||
|
||||
root->parse->commandType == CMD_DELETE))
|
||||
{
|
||||
/*
|
||||
* Relation is specified as a FOR UPDATE/SHARE target, so handle
|
||||
* that. (But we could also see LCS_NONE, meaning this isn't a
|
||||
* target relation after all.)
|
||||
*
|
||||
* For now, just ignore any [NO] KEY specification, since (a) it's
|
||||
* not clear what that means for a remote table that we don't have
|
||||
* complete information about, and (b) it wouldn't work anyway on
|
||||
* older remote servers. Likewise, we don't worry about NOWAIT.
|
||||
*/
|
||||
switch (rc->strength)
|
||||
/* Relation is UPDATE/DELETE target, so use FOR UPDATE */
|
||||
appendStringInfoString(buf, " FOR UPDATE");
|
||||
|
||||
/* Add the relation alias if we are here for a join relation */
|
||||
if (rel->reloptkind == RELOPT_JOINREL)
|
||||
appendStringInfo(buf, " OF %s%d", REL_ALIAS_PREFIX, relid);
|
||||
}
|
||||
else
|
||||
{
|
||||
PlanRowMark *rc = get_plan_rowmark(root->rowMarks, relid);
|
||||
|
||||
if (rc)
|
||||
{
|
||||
case LCS_NONE:
|
||||
/* No locking needed */
|
||||
break;
|
||||
case LCS_FORKEYSHARE:
|
||||
case LCS_FORSHARE:
|
||||
appendStringInfoString(buf, " FOR SHARE");
|
||||
break;
|
||||
case LCS_FORNOKEYUPDATE:
|
||||
case LCS_FORUPDATE:
|
||||
appendStringInfoString(buf, " FOR UPDATE");
|
||||
break;
|
||||
/*
|
||||
* Relation is specified as a FOR UPDATE/SHARE target, so
|
||||
* handle that. (But we could also see LCS_NONE, meaning this
|
||||
* isn't a target relation after all.)
|
||||
*
|
||||
* For now, just ignore any [NO] KEY specification, since (a)
|
||||
* it's not clear what that means for a remote table that we
|
||||
* don't have complete information about, and (b) it wouldn't
|
||||
* work anyway on older remote servers. Likewise, we don't
|
||||
* worry about NOWAIT.
|
||||
*/
|
||||
switch (rc->strength)
|
||||
{
|
||||
case LCS_NONE:
|
||||
/* No locking needed */
|
||||
break;
|
||||
case LCS_FORKEYSHARE:
|
||||
case LCS_FORSHARE:
|
||||
appendStringInfoString(buf, " FOR SHARE");
|
||||
break;
|
||||
case LCS_FORNOKEYUPDATE:
|
||||
case LCS_FORUPDATE:
|
||||
appendStringInfoString(buf, " FOR UPDATE");
|
||||
break;
|
||||
}
|
||||
|
||||
/* Add the relation alias if we are here for a join relation */
|
||||
if (rel->reloptkind == RELOPT_JOINREL &&
|
||||
rc->strength != LCS_NONE)
|
||||
appendStringInfo(buf, " OF %s%d", REL_ALIAS_PREFIX, relid);
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
/*
|
||||
* Deparse WHERE clauses in given list of RestrictInfos and append them to
|
||||
* context->buf.
|
||||
* Deparse conditions from the provided list and append them to buf.
|
||||
*
|
||||
* The conditions in the list are assumed to be ANDed. This function is used to
|
||||
* deparse both WHERE clauses and JOIN .. ON clauses.
|
||||
*/
|
||||
static void
|
||||
appendWhereClause(List *exprs, deparse_expr_cxt *context)
|
||||
appendConditions(List *exprs, deparse_expr_cxt *context)
|
||||
{
|
||||
int nestlevel;
|
||||
ListCell *lc;
|
||||
@ -945,16 +1033,25 @@ appendWhereClause(List *exprs, deparse_expr_cxt *context)
|
||||
|
||||
foreach(lc, exprs)
|
||||
{
|
||||
RestrictInfo *ri = (RestrictInfo *) lfirst(lc);
|
||||
Expr *expr = (Expr *) lfirst(lc);
|
||||
|
||||
/*
|
||||
* Extract clause from RestrictInfo, if required. See comments in
|
||||
* declaration of PgFdwRelationInfo for details.
|
||||
*/
|
||||
if (IsA(expr, RestrictInfo))
|
||||
{
|
||||
RestrictInfo *ri = (RestrictInfo *) expr;
|
||||
|
||||
expr = ri->clause;
|
||||
}
|
||||
|
||||
/* Connect expressions with "AND" and parenthesize each condition. */
|
||||
if (is_first)
|
||||
appendStringInfoString(buf, " WHERE ");
|
||||
else
|
||||
if (!is_first)
|
||||
appendStringInfoString(buf, " AND ");
|
||||
|
||||
appendStringInfoChar(buf, '(');
|
||||
deparseExpr(ri->clause, context);
|
||||
deparseExpr(expr, context);
|
||||
appendStringInfoChar(buf, ')');
|
||||
|
||||
is_first = false;
|
||||
@ -963,6 +1060,156 @@ appendWhereClause(List *exprs, deparse_expr_cxt *context)
|
||||
reset_transmission_modes(nestlevel);
|
||||
}
|
||||
|
||||
/* Output join name for given join type */
|
||||
extern const char *
|
||||
get_jointype_name(JoinType jointype)
|
||||
{
|
||||
switch (jointype)
|
||||
{
|
||||
case JOIN_INNER:
|
||||
return "INNER";
|
||||
|
||||
case JOIN_LEFT:
|
||||
return "LEFT";
|
||||
|
||||
case JOIN_RIGHT:
|
||||
return "RIGHT";
|
||||
|
||||
case JOIN_FULL:
|
||||
return "FULL";
|
||||
|
||||
default:
|
||||
/* Shouldn't come here, but protect from buggy code. */
|
||||
elog(ERROR, "unsupported join type %d", jointype);
|
||||
}
|
||||
|
||||
/* Keep compiler happy */
|
||||
return NULL;
|
||||
}
|
||||
|
||||
/*
|
||||
* Deparse given targetlist and append it to context->buf.
|
||||
*
|
||||
* tlist is list of TargetEntry's which in turn contain Var nodes.
|
||||
*
|
||||
* retrieved_attrs is the list of continuously increasing integers starting
|
||||
* from 1. It has same number of entries as tlist.
|
||||
*/
|
||||
static void
|
||||
deparseExplicitTargetList(List *tlist, List **retrieved_attrs,
|
||||
deparse_expr_cxt *context)
|
||||
{
|
||||
ListCell *lc;
|
||||
StringInfo buf = context->buf;
|
||||
int i = 0;
|
||||
|
||||
*retrieved_attrs = NIL;
|
||||
|
||||
foreach(lc, tlist)
|
||||
{
|
||||
TargetEntry *tle = (TargetEntry *) lfirst(lc);
|
||||
Var *var;
|
||||
|
||||
/* Extract expression if TargetEntry node */
|
||||
Assert(IsA(tle, TargetEntry));
|
||||
var = (Var *) tle->expr;
|
||||
/* We expect only Var nodes here */
|
||||
Assert(IsA(var, Var));
|
||||
|
||||
if (i > 0)
|
||||
appendStringInfoString(buf, ", ");
|
||||
deparseVar(var, context);
|
||||
|
||||
*retrieved_attrs = lappend_int(*retrieved_attrs, i + 1);
|
||||
|
||||
i++;
|
||||
}
|
||||
|
||||
if (i == 0)
|
||||
appendStringInfoString(buf, "NULL");
|
||||
}
|
||||
|
||||
/*
|
||||
* Construct FROM clause for given relation
|
||||
*
|
||||
* The function constructs ... JOIN ... ON ... for join relation. For a base
|
||||
* relation it just returns schema-qualified tablename, with the appropriate
|
||||
* alias if so requested.
|
||||
*/
|
||||
void
|
||||
deparseFromExprForRel(StringInfo buf, PlannerInfo *root, RelOptInfo *foreignrel,
|
||||
bool use_alias, List **params_list)
|
||||
{
|
||||
PgFdwRelationInfo *fpinfo = (PgFdwRelationInfo *) foreignrel->fdw_private;
|
||||
|
||||
if (foreignrel->reloptkind == RELOPT_JOINREL)
|
||||
{
|
||||
RelOptInfo *rel_o = fpinfo->outerrel;
|
||||
RelOptInfo *rel_i = fpinfo->innerrel;
|
||||
StringInfoData join_sql_o;
|
||||
StringInfoData join_sql_i;
|
||||
|
||||
/* Deparse outer relation */
|
||||
initStringInfo(&join_sql_o);
|
||||
deparseFromExprForRel(&join_sql_o, root, rel_o, true, params_list);
|
||||
|
||||
/* Deparse inner relation */
|
||||
initStringInfo(&join_sql_i);
|
||||
deparseFromExprForRel(&join_sql_i, root, rel_i, true, params_list);
|
||||
|
||||
/*
|
||||
* For a join relation FROM clause entry is deparsed as
|
||||
*
|
||||
* ((outer relation) <join type> (inner relation) ON (joinclauses)
|
||||
*/
|
||||
appendStringInfo(buf, "(%s %s JOIN %s ON ", join_sql_o.data,
|
||||
get_jointype_name(fpinfo->jointype), join_sql_i.data);
|
||||
|
||||
/* Append join clause; (TRUE) if no join clause */
|
||||
if (fpinfo->joinclauses)
|
||||
{
|
||||
deparse_expr_cxt context;
|
||||
|
||||
context.buf = buf;
|
||||
context.foreignrel = foreignrel;
|
||||
context.root = root;
|
||||
context.params_list = params_list;
|
||||
|
||||
appendStringInfo(buf, "(");
|
||||
appendConditions(fpinfo->joinclauses, &context);
|
||||
appendStringInfo(buf, ")");
|
||||
}
|
||||
else
|
||||
appendStringInfoString(buf, "(TRUE)");
|
||||
|
||||
/* End the FROM clause entry. */
|
||||
appendStringInfo(buf, ")");
|
||||
}
|
||||
else
|
||||
{
|
||||
RangeTblEntry *rte = planner_rt_fetch(foreignrel->relid, root);
|
||||
|
||||
/*
|
||||
* Core code already has some lock on each rel being planned, so we
|
||||
* can use NoLock here.
|
||||
*/
|
||||
Relation rel = heap_open(rte->relid, NoLock);
|
||||
|
||||
deparseRelation(buf, rel);
|
||||
|
||||
/*
|
||||
* Add a unique alias to avoid any conflict in relation names due to
|
||||
* pulled up subqueries in the query being built for a pushed down
|
||||
* join.
|
||||
*/
|
||||
if (use_alias)
|
||||
appendStringInfo(buf, " %s%d", REL_ALIAS_PREFIX, foreignrel->relid);
|
||||
|
||||
heap_close(rel, NoLock);
|
||||
}
|
||||
return;
|
||||
}
|
||||
|
||||
/*
|
||||
* deparse remote INSERT statement
|
||||
*
|
||||
@ -996,7 +1243,7 @@ deparseInsertSql(StringInfo buf, PlannerInfo *root,
|
||||
appendStringInfoString(buf, ", ");
|
||||
first = false;
|
||||
|
||||
deparseColumnRef(buf, rtindex, attnum, root);
|
||||
deparseColumnRef(buf, rtindex, attnum, root, false);
|
||||
}
|
||||
|
||||
appendStringInfoString(buf, ") VALUES (");
|
||||
@ -1057,7 +1304,7 @@ deparseUpdateSql(StringInfo buf, PlannerInfo *root,
|
||||
appendStringInfoString(buf, ", ");
|
||||
first = false;
|
||||
|
||||
deparseColumnRef(buf, rtindex, attnum, root);
|
||||
deparseColumnRef(buf, rtindex, attnum, root, false);
|
||||
appendStringInfo(buf, " = $%d", pindex);
|
||||
pindex++;
|
||||
}
|
||||
@ -1120,7 +1367,7 @@ deparseReturningList(StringInfo buf, PlannerInfo *root,
|
||||
}
|
||||
|
||||
if (attrs_used != NULL)
|
||||
deparseTargetList(buf, root, rtindex, rel, true, attrs_used,
|
||||
deparseTargetList(buf, root, rtindex, rel, true, attrs_used, false,
|
||||
retrieved_attrs);
|
||||
else
|
||||
*retrieved_attrs = NIL;
|
||||
@ -1212,45 +1459,97 @@ deparseAnalyzeSql(StringInfo buf, Relation rel, List **retrieved_attrs)
|
||||
/*
|
||||
* Construct name to use for given column, and emit it into buf.
|
||||
* If it has a column_name FDW option, use that instead of attribute name.
|
||||
*
|
||||
* If qualify_col is true, qualify column name with the alias of relation.
|
||||
*/
|
||||
static void
|
||||
deparseColumnRef(StringInfo buf, int varno, int varattno, PlannerInfo *root)
|
||||
deparseColumnRef(StringInfo buf, int varno, int varattno, PlannerInfo *root,
|
||||
bool qualify_col)
|
||||
{
|
||||
RangeTblEntry *rte;
|
||||
char *colname = NULL;
|
||||
List *options;
|
||||
ListCell *lc;
|
||||
|
||||
/* varno must not be any of OUTER_VAR, INNER_VAR and INDEX_VAR. */
|
||||
Assert(!IS_SPECIAL_VARNO(varno));
|
||||
|
||||
/* Get RangeTblEntry from array in PlannerInfo. */
|
||||
rte = planner_rt_fetch(varno, root);
|
||||
|
||||
/*
|
||||
* If it's a column of a foreign table, and it has the column_name FDW
|
||||
* option, use that value.
|
||||
*/
|
||||
options = GetForeignColumnOptions(rte->relid, varattno);
|
||||
foreach(lc, options)
|
||||
/* varattno can be a whole-row reference, ctid or a regular table column */
|
||||
if (varattno == SelfItemPointerAttributeNumber)
|
||||
{
|
||||
DefElem *def = (DefElem *) lfirst(lc);
|
||||
|
||||
if (strcmp(def->defname, "column_name") == 0)
|
||||
{
|
||||
colname = defGetString(def);
|
||||
break;
|
||||
}
|
||||
if (qualify_col)
|
||||
ADD_REL_QUALIFIER(buf, varno);
|
||||
appendStringInfoString(buf, "ctid");
|
||||
}
|
||||
else if (varattno == 0)
|
||||
{
|
||||
/* Whole row reference */
|
||||
Relation rel;
|
||||
Bitmapset *attrs_used;
|
||||
|
||||
/*
|
||||
* If it's a column of a regular table or it doesn't have column_name FDW
|
||||
* option, use attribute name.
|
||||
*/
|
||||
if (colname == NULL)
|
||||
colname = get_relid_attribute_name(rte->relid, varattno);
|
||||
/* Required only to be passed down to deparseTargetList(). */
|
||||
List *retrieved_attrs;
|
||||
|
||||
appendStringInfoString(buf, quote_identifier(colname));
|
||||
/* Get RangeTblEntry from array in PlannerInfo. */
|
||||
rte = planner_rt_fetch(varno, root);
|
||||
|
||||
/*
|
||||
* The lock on the relation will be held by upper callers, so it's
|
||||
* fine to open it with no lock here.
|
||||
*/
|
||||
rel = heap_open(rte->relid, NoLock);
|
||||
|
||||
/*
|
||||
* The local name of the foreign table can not be recognized by the
|
||||
* foreign server and the table it references on foreign server might
|
||||
* have different column ordering or different columns than those
|
||||
* declared locally. Hence we have to deparse whole-row reference as
|
||||
* ROW(columns referenced locally). Construct this by deparsing a
|
||||
* "whole row" attribute.
|
||||
*/
|
||||
attrs_used = bms_add_member(NULL,
|
||||
0 - FirstLowInvalidHeapAttributeNumber);
|
||||
appendStringInfoString(buf, "ROW(");
|
||||
deparseTargetList(buf, root, varno, rel, false, attrs_used, qualify_col,
|
||||
&retrieved_attrs);
|
||||
appendStringInfoString(buf, ")");
|
||||
heap_close(rel, NoLock);
|
||||
bms_free(attrs_used);
|
||||
}
|
||||
else
|
||||
{
|
||||
char *colname = NULL;
|
||||
List *options;
|
||||
ListCell *lc;
|
||||
|
||||
/* varno must not be any of OUTER_VAR, INNER_VAR and INDEX_VAR. */
|
||||
Assert(!IS_SPECIAL_VARNO(varno));
|
||||
|
||||
/* Get RangeTblEntry from array in PlannerInfo. */
|
||||
rte = planner_rt_fetch(varno, root);
|
||||
|
||||
/*
|
||||
* If it's a column of a foreign table, and it has the column_name FDW
|
||||
* option, use that value.
|
||||
*/
|
||||
options = GetForeignColumnOptions(rte->relid, varattno);
|
||||
foreach(lc, options)
|
||||
{
|
||||
DefElem *def = (DefElem *) lfirst(lc);
|
||||
|
||||
if (strcmp(def->defname, "column_name") == 0)
|
||||
{
|
||||
colname = defGetString(def);
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
/*
|
||||
* If it's a column of a regular table or it doesn't have column_name
|
||||
* FDW option, use attribute name.
|
||||
*/
|
||||
if (colname == NULL)
|
||||
colname = get_relid_attribute_name(rte->relid, varattno);
|
||||
|
||||
if (qualify_col)
|
||||
ADD_REL_QUALIFIER(buf, varno);
|
||||
|
||||
appendStringInfoString(buf, quote_identifier(colname));
|
||||
}
|
||||
}
|
||||
|
||||
/*
|
||||
@ -1395,14 +1694,12 @@ deparseExpr(Expr *node, deparse_expr_cxt *context)
|
||||
static void
|
||||
deparseVar(Var *node, deparse_expr_cxt *context)
|
||||
{
|
||||
StringInfo buf = context->buf;
|
||||
bool qualify_col = (context->foreignrel->reloptkind == RELOPT_JOINREL);
|
||||
|
||||
if (node->varno == context->foreignrel->relid &&
|
||||
if (bms_is_member(node->varno, context->foreignrel->relids) &&
|
||||
node->varlevelsup == 0)
|
||||
{
|
||||
/* Var belongs to foreign table */
|
||||
deparseColumnRef(buf, node->varno, node->varattno, context->root);
|
||||
}
|
||||
deparseColumnRef(context->buf, node->varno, node->varattno,
|
||||
context->root, qualify_col);
|
||||
else
|
||||
{
|
||||
/* Treat like a Param */
|
||||
|
File diff suppressed because it is too large
Load Diff
File diff suppressed because it is too large
Load Diff
@ -26,7 +26,25 @@
|
||||
*/
|
||||
typedef struct PgFdwRelationInfo
|
||||
{
|
||||
/* baserestrictinfo clauses, broken down into safe and unsafe subsets. */
|
||||
/*
|
||||
* True means that the relation can be pushed down. Always true for simple
|
||||
* foreign scan.
|
||||
*/
|
||||
bool pushdown_safe;
|
||||
|
||||
/*
|
||||
* Restriction clauses, divided into safe and unsafe to pushdown subsets.
|
||||
*
|
||||
* For a base foreign relation this is a list of clauses along-with
|
||||
* RestrictInfo wrapper. Keeping RestrictInfo wrapper helps while dividing
|
||||
* scan_clauses in postgresGetForeignPlan into safe and unsafe subsets.
|
||||
* Also it helps in estimating costs since RestrictInfo caches the
|
||||
* selectivity and qual cost for the clause in it.
|
||||
*
|
||||
* For a join relation, however, they are part of otherclause list
|
||||
* obtained from extract_actual_join_clauses, which strips RestrictInfo
|
||||
* construct. So, for a join relation they are list of bare clauses.
|
||||
*/
|
||||
List *remote_conds;
|
||||
List *local_conds;
|
||||
|
||||
@ -37,11 +55,17 @@ typedef struct PgFdwRelationInfo
|
||||
QualCost local_conds_cost;
|
||||
Selectivity local_conds_sel;
|
||||
|
||||
/* Estimated size and cost for a scan with baserestrictinfo quals. */
|
||||
/* Selectivity of join conditions */
|
||||
Selectivity joinclause_sel;
|
||||
|
||||
/* Estimated size and cost for a scan or join. */
|
||||
double rows;
|
||||
int width;
|
||||
Cost startup_cost;
|
||||
Cost total_cost;
|
||||
/* Costs excluding costs for transferring data from the foreign server */
|
||||
Cost rel_startup_cost;
|
||||
Cost rel_total_cost;
|
||||
|
||||
/* Options extracted from catalogs. */
|
||||
bool use_remote_estimate;
|
||||
@ -55,6 +79,19 @@ typedef struct PgFdwRelationInfo
|
||||
UserMapping *user; /* only set in use_remote_estimate mode */
|
||||
|
||||
int fetch_size; /* fetch size for this remote table */
|
||||
|
||||
/*
|
||||
* Name of the relation while EXPLAINing ForeignScan. It is used for join
|
||||
* relations but is set for all relations. For join relation, the name
|
||||
* indicates which foreign tables are being joined and the join type used.
|
||||
*/
|
||||
StringInfo relation_name;
|
||||
|
||||
/* Join information */
|
||||
RelOptInfo *outerrel;
|
||||
RelOptInfo *innerrel;
|
||||
JoinType jointype;
|
||||
List *joinclauses;
|
||||
} PgFdwRelationInfo;
|
||||
|
||||
/* in postgres_fdw.c */
|
||||
@ -102,12 +139,15 @@ extern void deparseAnalyzeSql(StringInfo buf, Relation rel,
|
||||
List **retrieved_attrs);
|
||||
extern void deparseStringLiteral(StringInfo buf, const char *val);
|
||||
extern Expr *find_em_expr_for_rel(EquivalenceClass *ec, RelOptInfo *rel);
|
||||
extern List *build_tlist_to_deparse(RelOptInfo *foreign_rel);
|
||||
extern void deparseSelectStmtForRel(StringInfo buf, PlannerInfo *root,
|
||||
RelOptInfo *baserel, List *remote_conds, List *pathkeys,
|
||||
RelOptInfo *foreignrel, List *tlist,
|
||||
List *remote_conds, List *pathkeys,
|
||||
List **retrieved_attrs, List **params_list);
|
||||
|
||||
/* in shippable.c */
|
||||
extern bool is_builtin(Oid objectId);
|
||||
extern bool is_shippable(Oid objectId, Oid classId, PgFdwRelationInfo *fpinfo);
|
||||
extern const char *get_jointype_name(JoinType jointype);
|
||||
|
||||
#endif /* POSTGRES_FDW_H */
|
||||
|
@ -11,12 +11,17 @@ DO $d$
|
||||
OPTIONS (dbname '$$||current_database()||$$',
|
||||
port '$$||current_setting('port')||$$'
|
||||
)$$;
|
||||
EXECUTE $$CREATE SERVER loopback2 FOREIGN DATA WRAPPER postgres_fdw
|
||||
OPTIONS (dbname '$$||current_database()||$$',
|
||||
port '$$||current_setting('port')||$$'
|
||||
)$$;
|
||||
END;
|
||||
$d$;
|
||||
|
||||
CREATE USER MAPPING FOR public SERVER testserver1
|
||||
OPTIONS (user 'value', password 'value');
|
||||
CREATE USER MAPPING FOR CURRENT_USER SERVER loopback;
|
||||
CREATE USER MAPPING FOR CURRENT_USER SERVER loopback2;
|
||||
|
||||
-- ===================================================================
|
||||
-- create objects used through FDW loopback server
|
||||
@ -39,6 +44,18 @@ CREATE TABLE "S 1"."T 2" (
|
||||
c2 text,
|
||||
CONSTRAINT t2_pkey PRIMARY KEY (c1)
|
||||
);
|
||||
CREATE TABLE "S 1"."T 3" (
|
||||
c1 int NOT NULL,
|
||||
c2 int NOT NULL,
|
||||
c3 text,
|
||||
CONSTRAINT t3_pkey PRIMARY KEY (c1)
|
||||
);
|
||||
CREATE TABLE "S 1"."T 4" (
|
||||
c1 int NOT NULL,
|
||||
c2 int NOT NULL,
|
||||
c3 text,
|
||||
CONSTRAINT t4_pkey PRIMARY KEY (c1)
|
||||
);
|
||||
|
||||
INSERT INTO "S 1"."T 1"
|
||||
SELECT id,
|
||||
@ -54,9 +71,23 @@ INSERT INTO "S 1"."T 2"
|
||||
SELECT id,
|
||||
'AAA' || to_char(id, 'FM000')
|
||||
FROM generate_series(1, 100) id;
|
||||
INSERT INTO "S 1"."T 3"
|
||||
SELECT id,
|
||||
id + 1,
|
||||
'AAA' || to_char(id, 'FM000')
|
||||
FROM generate_series(1, 100) id;
|
||||
DELETE FROM "S 1"."T 3" WHERE c1 % 2 != 0; -- delete for outer join tests
|
||||
INSERT INTO "S 1"."T 4"
|
||||
SELECT id,
|
||||
id + 1,
|
||||
'AAA' || to_char(id, 'FM000')
|
||||
FROM generate_series(1, 100) id;
|
||||
DELETE FROM "S 1"."T 4" WHERE c1 % 3 != 0; -- delete for outer join tests
|
||||
|
||||
ANALYZE "S 1"."T 1";
|
||||
ANALYZE "S 1"."T 2";
|
||||
ANALYZE "S 1"."T 3";
|
||||
ANALYZE "S 1"."T 4";
|
||||
|
||||
-- ===================================================================
|
||||
-- create foreign tables
|
||||
@ -87,6 +118,24 @@ CREATE FOREIGN TABLE ft2 (
|
||||
) SERVER loopback;
|
||||
ALTER FOREIGN TABLE ft2 DROP COLUMN cx;
|
||||
|
||||
CREATE FOREIGN TABLE ft4 (
|
||||
c1 int NOT NULL,
|
||||
c2 int NOT NULL,
|
||||
c3 text
|
||||
) SERVER loopback OPTIONS (schema_name 'S 1', table_name 'T 3');
|
||||
|
||||
CREATE FOREIGN TABLE ft5 (
|
||||
c1 int NOT NULL,
|
||||
c2 int NOT NULL,
|
||||
c3 text
|
||||
) SERVER loopback OPTIONS (schema_name 'S 1', table_name 'T 4');
|
||||
|
||||
CREATE FOREIGN TABLE ft6 (
|
||||
c1 int NOT NULL,
|
||||
c2 int NOT NULL,
|
||||
c3 text
|
||||
) SERVER loopback2 OPTIONS (schema_name 'S 1', table_name 'T 4');
|
||||
|
||||
-- ===================================================================
|
||||
-- tests for validator
|
||||
-- ===================================================================
|
||||
@ -168,8 +217,6 @@ EXPLAIN (VERBOSE, COSTS false) SELECT * FROM ft1 t1 WHERE c1 = 102 FOR SHARE;
|
||||
SELECT * FROM ft1 t1 WHERE c1 = 102 FOR SHARE;
|
||||
-- aggregate
|
||||
SELECT COUNT(*) FROM ft1 t1;
|
||||
-- join two tables
|
||||
SELECT t1.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10;
|
||||
-- subquery
|
||||
SELECT * FROM ft1 t1 WHERE t1.c3 IN (SELECT c3 FROM ft2 t2 WHERE c1 <= 10) ORDER BY c1;
|
||||
-- subquery+MAX
|
||||
@ -208,10 +255,11 @@ EXPLAIN (VERBOSE, COSTS false) SELECT * FROM ft1 t1 WHERE c1 = ANY(ARRAY[c2, 1,
|
||||
EXPLAIN (VERBOSE, COSTS false) SELECT * FROM ft1 t1 WHERE c1 = (ARRAY[c1,c2,3])[1]; -- ArrayRef
|
||||
EXPLAIN (VERBOSE, COSTS false) SELECT * FROM ft1 t1 WHERE c6 = E'foo''s\\bar'; -- check special chars
|
||||
EXPLAIN (VERBOSE, COSTS false) SELECT * FROM ft1 t1 WHERE c8 = 'foo'; -- can't be sent to remote
|
||||
-- parameterized remote path
|
||||
-- parameterized remote path for foreign table
|
||||
EXPLAIN (VERBOSE, COSTS false)
|
||||
SELECT * FROM ft2 a, ft2 b WHERE a.c1 = 47 AND b.c1 = a.c2;
|
||||
SELECT * FROM "S 1"."T 1" a, ft2 b WHERE a."C 1" = 47 AND b.c1 = a.c2;
|
||||
SELECT * FROM ft2 a, ft2 b WHERE a.c1 = 47 AND b.c1 = a.c2;
|
||||
|
||||
-- check both safe and unsafe join conditions
|
||||
EXPLAIN (VERBOSE, COSTS false)
|
||||
SELECT * FROM ft2 a, ft2 b
|
||||
@ -270,6 +318,158 @@ EXPLAIN (VERBOSE, COSTS false)
|
||||
SELECT count(c3) FROM ft1 t1 WHERE t1.c1 === t1.c2;
|
||||
SELECT count(c3) FROM ft1 t1 WHERE t1.c1 === t1.c2;
|
||||
|
||||
-- ===================================================================
|
||||
-- JOIN queries
|
||||
-- ===================================================================
|
||||
-- Analyze ft4 and ft5 so that we have better statistics. These tables do not
|
||||
-- have use_remote_estimate set.
|
||||
ANALYZE ft4;
|
||||
ANALYZE ft5;
|
||||
|
||||
-- join two tables
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10;
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10;
|
||||
-- join three tables
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c2, t3.c3 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) JOIN ft4 t3 ON (t3.c1 = t1.c1) ORDER BY t1.c3, t1.c1 OFFSET 10 LIMIT 10;
|
||||
SELECT t1.c1, t2.c2, t3.c3 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) JOIN ft4 t3 ON (t3.c1 = t1.c1) ORDER BY t1.c3, t1.c1 OFFSET 10 LIMIT 10;
|
||||
-- left outer join
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft4 t1 LEFT JOIN ft5 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c1, t2.c1 OFFSET 10 LIMIT 10;
|
||||
SELECT t1.c1, t2.c1 FROM ft4 t1 LEFT JOIN ft5 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c1, t2.c1 OFFSET 10 LIMIT 10;
|
||||
-- left outer join + placement of clauses.
|
||||
-- clauses within the nullable side are not pulled up, but top level clause on
|
||||
-- non-nullable side is pushed into non-nullable side
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t1.c2, t2.c1, t2.c2 FROM ft4 t1 LEFT JOIN (SELECT * FROM ft5 WHERE c1 < 10) t2 ON (t1.c1 = t2.c1) WHERE t1.c1 < 10;
|
||||
SELECT t1.c1, t1.c2, t2.c1, t2.c2 FROM ft4 t1 LEFT JOIN (SELECT * FROM ft5 WHERE c1 < 10) t2 ON (t1.c1 = t2.c1) WHERE t1.c1 < 10;
|
||||
-- clauses within the nullable side are not pulled up, but the top level clause
|
||||
-- on nullable side is not pushed down into nullable side
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t1.c2, t2.c1, t2.c2 FROM ft4 t1 LEFT JOIN (SELECT * FROM ft5 WHERE c1 < 10) t2 ON (t1.c1 = t2.c1)
|
||||
WHERE (t2.c1 < 10 OR t2.c1 IS NULL) AND t1.c1 < 10;
|
||||
SELECT t1.c1, t1.c2, t2.c1, t2.c2 FROM ft4 t1 LEFT JOIN (SELECT * FROM ft5 WHERE c1 < 10) t2 ON (t1.c1 = t2.c1)
|
||||
WHERE (t2.c1 < 10 OR t2.c1 IS NULL) AND t1.c1 < 10;
|
||||
-- right outer join
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft5 t1 RIGHT JOIN ft4 t2 ON (t1.c1 = t2.c1) ORDER BY t2.c1, t1.c1 OFFSET 10 LIMIT 10;
|
||||
SELECT t1.c1, t2.c1 FROM ft5 t1 RIGHT JOIN ft4 t2 ON (t1.c1 = t2.c1) ORDER BY t2.c1, t1.c1 OFFSET 10 LIMIT 10;
|
||||
-- full outer join
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft4 t1 FULL JOIN ft5 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c1, t2.c1 OFFSET 45 LIMIT 10;
|
||||
SELECT t1.c1, t2.c1 FROM ft4 t1 FULL JOIN ft5 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c1, t2.c1 OFFSET 45 LIMIT 10;
|
||||
-- full outer join + WHERE clause, only matched rows
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft4 t1 FULL JOIN ft5 t2 ON (t1.c1 = t2.c1) WHERE (t1.c1 = t2.c1 OR t1.c1 IS NULL) ORDER BY t1.c1, t2.c1 OFFSET 10 LIMIT 10;
|
||||
SELECT t1.c1, t2.c1 FROM ft4 t1 FULL JOIN ft5 t2 ON (t1.c1 = t2.c1) WHERE (t1.c1 = t2.c1 OR t1.c1 IS NULL) ORDER BY t1.c1, t2.c1 OFFSET 10 LIMIT 10;
|
||||
-- join two tables with FOR UPDATE clause
|
||||
-- tests whole-row reference for row marks
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10 FOR UPDATE OF t1;
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10 FOR UPDATE OF t1;
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10 FOR UPDATE;
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10 FOR UPDATE;
|
||||
-- join two tables with FOR SHARE clause
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10 FOR SHARE OF t1;
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10 FOR SHARE OF t1;
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10 FOR SHARE;
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10 FOR SHARE;
|
||||
-- join in CTE
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
WITH t (c1_1, c1_3, c2_1) AS (SELECT t1.c1, t1.c3, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1)) SELECT c1_1, c2_1 FROM t ORDER BY c1_3, c1_1 OFFSET 100 LIMIT 10;
|
||||
WITH t (c1_1, c1_3, c2_1) AS (SELECT t1.c1, t1.c3, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1)) SELECT c1_1, c2_1 FROM t ORDER BY c1_3, c1_1 OFFSET 100 LIMIT 10;
|
||||
-- ctid with whole-row reference
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.ctid, t1, t2, t1.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10;
|
||||
SELECT t1.ctid, t1, t2, t1.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10;
|
||||
-- SEMI JOIN, not pushed down
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1 FROM ft1 t1 WHERE EXISTS (SELECT 1 FROM ft2 t2 WHERE t1.c1 = t2.c1) ORDER BY t1.c1 OFFSET 100 LIMIT 10;
|
||||
SELECT t1.c1 FROM ft1 t1 WHERE EXISTS (SELECT 1 FROM ft2 t2 WHERE t1.c1 = t2.c1) ORDER BY t1.c1 OFFSET 100 LIMIT 10;
|
||||
-- ANTI JOIN, not pushed down
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1 FROM ft1 t1 WHERE NOT EXISTS (SELECT 1 FROM ft2 t2 WHERE t1.c1 = t2.c2) ORDER BY t1.c1 OFFSET 100 LIMIT 10;
|
||||
SELECT t1.c1 FROM ft1 t1 WHERE NOT EXISTS (SELECT 1 FROM ft2 t2 WHERE t1.c1 = t2.c2) ORDER BY t1.c1 OFFSET 100 LIMIT 10;
|
||||
-- CROSS JOIN, not pushed down
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 CROSS JOIN ft2 t2 ORDER BY t1.c1, t2.c1 OFFSET 100 LIMIT 10;
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 CROSS JOIN ft2 t2 ORDER BY t1.c1, t2.c1 OFFSET 100 LIMIT 10;
|
||||
-- different server, not pushed down. No result expected.
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft5 t1 JOIN ft6 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c1, t2.c1 OFFSET 100 LIMIT 10;
|
||||
SELECT t1.c1, t2.c1 FROM ft5 t1 JOIN ft6 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c1, t2.c1 OFFSET 100 LIMIT 10;
|
||||
-- unsafe join conditions (c8 has a UDT), not pushed down. Practically a CROSS
|
||||
-- JOIN since c8 in both tables has same value.
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 LEFT JOIN ft2 t2 ON (t1.c8 = t2.c8) ORDER BY t1.c1, t2.c1 OFFSET 100 LIMIT 10;
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 LEFT JOIN ft2 t2 ON (t1.c8 = t2.c8) ORDER BY t1.c1, t2.c1 OFFSET 100 LIMIT 10;
|
||||
-- unsafe conditions on one side (c8 has a UDT), not pushed down.
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 LEFT JOIN ft2 t2 ON (t1.c1 = t2.c1) WHERE t1.c8 = 'foo' ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10;
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 LEFT JOIN ft2 t2 ON (t1.c1 = t2.c1) WHERE t1.c8 = 'foo' ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10;
|
||||
-- join where unsafe to pushdown condition in WHERE clause has a column not
|
||||
-- in the SELECT clause. In this test unsafe clause needs to have column
|
||||
-- references from both joining sides so that the clause is not pushed down
|
||||
-- into one of the joining sides.
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) WHERE t1.c8 = t2.c8 ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10;
|
||||
SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) WHERE t1.c8 = t2.c8 ORDER BY t1.c3, t1.c1 OFFSET 100 LIMIT 10;
|
||||
-- Aggregate after UNION, for testing setrefs
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1c1, avg(t1c1 + t2c1) FROM (SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) UNION SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1)) AS t (t1c1, t2c1) GROUP BY t1c1 ORDER BY t1c1 OFFSET 100 LIMIT 10;
|
||||
SELECT t1c1, avg(t1c1 + t2c1) FROM (SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1) UNION SELECT t1.c1, t2.c1 FROM ft1 t1 JOIN ft2 t2 ON (t1.c1 = t2.c1)) AS t (t1c1, t2c1) GROUP BY t1c1 ORDER BY t1c1 OFFSET 100 LIMIT 10;
|
||||
-- join with lateral reference
|
||||
EXPLAIN (COSTS false, VERBOSE)
|
||||
SELECT t1."C 1" FROM "S 1"."T 1" t1, LATERAL (SELECT DISTINCT t2.c1, t3.c1 FROM ft1 t2, ft2 t3 WHERE t2.c1 = t3.c1 AND t2.c2 = t1.c2) q ORDER BY t1."C 1" OFFSET 10 LIMIT 10;
|
||||
SELECT t1."C 1" FROM "S 1"."T 1" t1, LATERAL (SELECT DISTINCT t2.c1, t3.c1 FROM ft1 t2, ft2 t3 WHERE t2.c1 = t3.c1 AND t2.c2 = t1.c2) q ORDER BY t1."C 1" OFFSET 10 LIMIT 10;
|
||||
|
||||
-- create another user for permission, user mapping, effective user tests
|
||||
CREATE USER view_owner;
|
||||
-- grant privileges on ft4 and ft5 to view_owner
|
||||
GRANT ALL ON ft4 TO view_owner;
|
||||
GRANT ALL ON ft5 TO view_owner;
|
||||
-- prepare statement with current session user
|
||||
PREPARE join_stmt AS SELECT t1.c1, t2.c1 FROM ft4 t1 LEFT JOIN ft5 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c1, t2.c1 OFFSET 10 LIMIT 10;
|
||||
EXPLAIN (COSTS OFF, VERBOSE) EXECUTE join_stmt;
|
||||
EXECUTE join_stmt;
|
||||
-- change the session user to view_owner and execute the statement. Because of
|
||||
-- change in session user, the plan should get invalidated and created again.
|
||||
-- While creating the plan, it should throw error since there is no user mapping
|
||||
-- available for view_owner.
|
||||
SET SESSION ROLE view_owner;
|
||||
EXPLAIN (COSTS OFF, VERBOSE) EXECUTE join_stmt;
|
||||
EXECUTE join_stmt;
|
||||
RESET ROLE;
|
||||
DEALLOCATE join_stmt;
|
||||
|
||||
CREATE VIEW v_ft5 AS SELECT * FROM ft5;
|
||||
-- change owner of v_ft5 to view_owner so that the effective user for scan on
|
||||
-- ft5 is view_owner and not the current user.
|
||||
ALTER VIEW v_ft5 OWNER TO view_owner;
|
||||
-- create a public user mapping for loopback server
|
||||
-- drop user mapping for current_user.
|
||||
DROP USER MAPPING FOR CURRENT_USER SERVER loopback;
|
||||
CREATE USER MAPPING FOR PUBLIC SERVER loopback;
|
||||
-- different effective user for permission check, but same user mapping for the
|
||||
-- joining sides, join pushed down, no result expected.
|
||||
PREPARE join_stmt AS SELECT t1.c1, t2.c1 FROM ft5 t1 JOIN v_ft5 t2 ON (t1.c1 = t2.c1) ORDER BY t1.c1, t2.c1 OFFSET 100 LIMIT 10;
|
||||
EXPLAIN (COSTS false, VERBOSE) EXECUTE join_stmt;
|
||||
EXECUTE join_stmt;
|
||||
-- create user mapping for view_owner and execute the prepared statement
|
||||
-- the join should not be pushed down since joining relations now use two
|
||||
-- different user mappings
|
||||
CREATE USER MAPPING FOR view_owner SERVER loopback;
|
||||
EXPLAIN (COSTS false, VERBOSE) EXECUTE join_stmt;
|
||||
EXECUTE join_stmt;
|
||||
|
||||
-- recreate the dropped user mapping for further tests
|
||||
CREATE USER MAPPING FOR CURRENT_USER SERVER loopback;
|
||||
DROP USER MAPPING FOR PUBLIC SERVER loopback;
|
||||
|
||||
-- ===================================================================
|
||||
-- parameterized queries
|
||||
-- ===================================================================
|
||||
@ -348,6 +548,7 @@ DROP FUNCTION f_test(int);
|
||||
-- ===================================================================
|
||||
ALTER FOREIGN TABLE ft1 ALTER COLUMN c8 TYPE int;
|
||||
SELECT * FROM ft1 WHERE c1 = 1; -- ERROR
|
||||
SELECT ft1.c1, ft2.c2, ft1.c8 FROM ft1, ft2 WHERE ft1.c1 = ft2.c1 AND ft1.c1 = 1; -- ERROR
|
||||
ALTER FOREIGN TABLE ft1 ALTER COLUMN c8 TYPE user_enum;
|
||||
|
||||
-- ===================================================================
|
||||
@ -973,3 +1174,7 @@ WHERE ftrelid = 'table30000'::regclass
|
||||
AND ftoptions @> array['fetch_size=60000'];
|
||||
|
||||
ROLLBACK;
|
||||
|
||||
-- Cleanup
|
||||
DROP OWNED BY view_owner;
|
||||
DROP USER view_owner;
|
||||
|
@ -486,6 +486,16 @@
|
||||
be <literal>IMMUTABLE</> as well.
|
||||
</para>
|
||||
|
||||
<para>
|
||||
When <filename>postgres_fdw</> encounters a join between foreign tables on
|
||||
the same foreign server, it sends the entire join to the foreign server,
|
||||
unless for some reason it believes that it will be more efficient to fetch
|
||||
rows from each table individually, or unless the table references involved
|
||||
are subject to different user mappings. While sending the <literal>JOIN</>
|
||||
clauses, it takes the same precautions as mentioned above for the
|
||||
<literal>WHERE</> clauses.
|
||||
</para>
|
||||
|
||||
<para>
|
||||
The query that is actually sent to the remote server for execution can
|
||||
be examined using <command>EXPLAIN VERBOSE</>.
|
||||
|
Loading…
Reference in New Issue
Block a user