/*------------------------------------------------------------------------- * * preptlist.c * Routines to preprocess the parse tree target list * * For INSERT and UPDATE queries, the targetlist must contain an entry for * each attribute of the target relation in the correct order. For all query * types, we may need to add junk tlist entries for Vars used in the RETURNING * list and row ID information needed for SELECT FOR UPDATE locking and/or * EvalPlanQual checking. * * The rewriter's rewriteTargetListIU and rewriteTargetListUD routines * also do preprocessing of the targetlist. The division of labor between * here and there is partially historical, but it's not entirely arbitrary. * In particular, consider an UPDATE across an inheritance tree. What the * rewriter does need be done only once (because it depends only on the * properties of the parent relation). What's done here has to be done over * again for each child relation, because it depends on the column list of * the child, which might have more columns and/or a different column order * than the parent. * * The fact that rewriteTargetListIU sorts non-resjunk tlist entries by column * position, which expand_targetlist depends on, violates the above comment * because the sorting is only valid for the parent relation. In inherited * UPDATE cases, adjust_inherited_tlist runs in between to take care of fixing * the tlists for child tables to keep expand_targetlist happy. We do it like * that because it's faster in typical non-inherited cases. * * Portions Copyright (c) 2012-2014, TransLattice, Inc. * Portions Copyright (c) 1996-2017, PostgreSQL Global Development Group * Portions Copyright (c) 1994, Regents of the University of California * * IDENTIFICATION * src/backend/optimizer/prep/preptlist.c * *------------------------------------------------------------------------- */ #include "postgres.h" #include "access/heapam.h" #include "access/sysattr.h" #include "catalog/pg_type.h" #include "nodes/makefuncs.h" #ifdef XCP #include "nodes/nodeFuncs.h" #include "optimizer/clauses.h" #endif #include "optimizer/prep.h" #include "optimizer/tlist.h" #include "optimizer/var.h" #include "parser/parsetree.h" #include "parser/parse_coerce.h" #include "utils/rel.h" static List *expand_targetlist(List *tlist, int command_type, Index result_relation, List *range_table); /* * preprocess_targetlist * Driver for preprocessing the parse tree targetlist. * * Returns the new targetlist. */ List * preprocess_targetlist(PlannerInfo *root, List *tlist) { Query *parse = root->parse; int result_relation = parse->resultRelation; List *range_table = parse->rtable; CmdType command_type = parse->commandType; ListCell *lc; /* * Sanity check: if there is a result relation, it'd better be a real * relation not a subquery. Else parser or rewriter messed up. */ if (result_relation) { RangeTblEntry *rte = rt_fetch(result_relation, range_table); if (rte->subquery != NULL || rte->relid == InvalidOid) elog(ERROR, "subquery cannot be result relation"); } /* * for heap_form_tuple to work, the targetlist must match the exact order * of the attributes. We also need to fill in any missing attributes. -ay * 10/94 */ if (command_type == CMD_INSERT || command_type == CMD_UPDATE) tlist = expand_targetlist(tlist, command_type, result_relation, range_table); #ifdef XCP /* * If target relation is specified set distribution of the plan */ if (result_relation) { Relation rel = heap_open(getrelid(result_relation, range_table), NoLock); RelationLocInfo *rel_loc_info = rel->rd_locator_info; /* Is target table distributed ? */ if (rel_loc_info) { Distribution *distribution = makeNode(Distribution); ListCell *lc; distribution->distributionType = rel_loc_info->locatorType; foreach(lc, rel_loc_info->rl_nodeList) distribution->nodes = bms_add_member(distribution->nodes, lfirst_int(lc)); distribution->restrictNodes = NULL; if (rel_loc_info->partAttrNum) { /* * For INSERT and UPDATE plan tlist is matching the target table * layout */ if (command_type == CMD_INSERT || command_type == CMD_UPDATE) { TargetEntry *keyTle; keyTle = (TargetEntry *) list_nth(tlist, rel_loc_info->partAttrNum - 1); distribution->distributionExpr = (Node *) keyTle->expr; /* * We can restrict the distribution if the expression * is evaluated to a constant */ if (command_type == CMD_INSERT) { Oid keytype; Const *constExpr = NULL; keytype = exprType(distribution->distributionExpr); constExpr = (Const *) eval_const_expressions(root, distribution->distributionExpr); if (IsA(constExpr, Const) && constExpr->consttype == keytype) { List *nodeList = NIL; Bitmapset *tmpset = bms_copy(distribution->nodes); Bitmapset *restrictinfo = NULL; Locator *locator; int *nodenums; int i, count; while((i = bms_first_member(tmpset)) >= 0) nodeList = lappend_int(nodeList, i); bms_free(tmpset); locator = createLocator(distribution->distributionType, RELATION_ACCESS_INSERT, keytype, LOCATOR_LIST_LIST, 0, (void *) nodeList, (void **) &nodenums, false); count = GET_NODES(locator, constExpr->constvalue, constExpr->constisnull, NULL); for (i = 0; i < count; i++) restrictinfo = bms_add_member(restrictinfo, nodenums[i]); distribution->restrictNodes = restrictinfo; list_free(nodeList); freeLocator(locator); } } } /* * For delete we need to add the partitioning key of the target * table to the tlist, so distribution can be correctly handled * trough all the planning process. */ if (command_type == CMD_DELETE) { Form_pg_attribute att_tup; TargetEntry *tle; Var *var; att_tup = rel->rd_att->attrs[rel_loc_info->partAttrNum - 1]; var = makeVar(result_relation, rel_loc_info->partAttrNum, att_tup->atttypid, att_tup->atttypmod, att_tup->attcollation, 0); tle = makeTargetEntry((Expr *) var, list_length(tlist) + 1, pstrdup(NameStr(att_tup->attname)), true); tlist = lappend(tlist, tle); distribution->distributionExpr = (Node *) var; } } else distribution->distributionExpr = NULL; root->distribution = distribution; } else root->distribution = NULL; heap_close(rel, NoLock); } #endif /* * Add necessary junk columns for rowmarked rels. These values are needed * for locking of rels selected FOR UPDATE/SHARE, and to do EvalPlanQual * rechecking. See comments for PlanRowMark in plannodes.h. */ foreach(lc, root->rowMarks) { PlanRowMark *rc = (PlanRowMark *) lfirst(lc); Var *var; char resname[32]; TargetEntry *tle; /* child rels use the same junk attrs as their parents */ if (rc->rti != rc->prti) continue; if (rc->allMarkTypes & ~(1 << ROW_MARK_COPY)) { /* Need to fetch TID */ var = makeVar(rc->rti, SelfItemPointerAttributeNumber, TIDOID, -1, InvalidOid, 0); snprintf(resname, sizeof(resname), "ctid%u", rc->rowmarkId); tle = makeTargetEntry((Expr *) var, list_length(tlist) + 1, pstrdup(resname), true); tlist = lappend(tlist, tle); } if (rc->allMarkTypes & (1 << ROW_MARK_COPY)) { /* Need the whole row as a junk var */ var = makeWholeRowVar(rt_fetch(rc->rti, range_table), rc->rti, 0, false); snprintf(resname, sizeof(resname), "wholerow%u", rc->rowmarkId); tle = makeTargetEntry((Expr *) var, list_length(tlist) + 1, pstrdup(resname), true); tlist = lappend(tlist, tle); } /* If parent of inheritance tree, always fetch the tableoid too. */ if (rc->isParent) { var = makeVar(rc->rti, TableOidAttributeNumber, OIDOID, -1, InvalidOid, 0); snprintf(resname, sizeof(resname), "tableoid%u", rc->rowmarkId); tle = makeTargetEntry((Expr *) var, list_length(tlist) + 1, pstrdup(resname), true); tlist = lappend(tlist, tle); } } /* * If the query has a RETURNING list, add resjunk entries for any Vars * used in RETURNING that belong to other relations. We need to do this * to make these Vars available for the RETURNING calculation. Vars that * belong to the result rel don't need to be added, because they will be * made to refer to the actual heap tuple. */ if (parse->returningList && list_length(parse->rtable) > 1) { List *vars; ListCell *l; vars = pull_var_clause((Node *) parse->returningList, PVC_RECURSE_AGGREGATES | PVC_RECURSE_WINDOWFUNCS | PVC_INCLUDE_PLACEHOLDERS); foreach(l, vars) { Var *var = (Var *) lfirst(l); TargetEntry *tle; if (IsA(var, Var) && var->varno == result_relation) continue; /* don't need it */ if (tlist_member((Expr *) var, tlist)) continue; /* already got it */ tle = makeTargetEntry((Expr *) var, list_length(tlist) + 1, NULL, true); tlist = lappend(tlist, tle); } list_free(vars); } return tlist; } /* * preprocess_onconflict_targetlist * Process ON CONFLICT SET targetlist. * * Returns the new targetlist. */ List * preprocess_onconflict_targetlist(List *tlist, int result_relation, List *range_table) { return expand_targetlist(tlist, CMD_UPDATE, result_relation, range_table); } /***************************************************************************** * * TARGETLIST EXPANSION * *****************************************************************************/ /* * expand_targetlist * Given a target list as generated by the parser and a result relation, * add targetlist entries for any missing attributes, and ensure the * non-junk attributes appear in proper field order. */ static List * expand_targetlist(List *tlist, int command_type, Index result_relation, List *range_table) { List *new_tlist = NIL; ListCell *tlist_item; Relation rel; int attrno, numattrs; tlist_item = list_head(tlist); /* * The rewriter should have already ensured that the TLEs are in correct * order; but we have to insert TLEs for any missing attributes. * * Scan the tuple description in the relation's relcache entry to make * sure we have all the user attributes in the right order. We assume * that the rewriter already acquired at least AccessShareLock on the * relation, so we need no lock here. */ rel = heap_open(getrelid(result_relation, range_table), NoLock); numattrs = RelationGetNumberOfAttributes(rel); for (attrno = 1; attrno <= numattrs; attrno++) { Form_pg_attribute att_tup = rel->rd_att->attrs[attrno - 1]; TargetEntry *new_tle = NULL; if (tlist_item != NULL) { TargetEntry *old_tle = (TargetEntry *) lfirst(tlist_item); if (!old_tle->resjunk && old_tle->resno == attrno) { new_tle = old_tle; tlist_item = lnext(tlist_item); } } if (new_tle == NULL) { /* * Didn't find a matching tlist entry, so make one. * * For INSERT, generate a NULL constant. (We assume the rewriter * would have inserted any available default value.) Also, if the * column isn't dropped, apply any domain constraints that might * exist --- this is to catch domain NOT NULL. * * For UPDATE, generate a Var reference to the existing value of * the attribute, so that it gets copied to the new tuple. But * generate a NULL for dropped columns (we want to drop any old * values). * * When generating a NULL constant for a dropped column, we label * it INT4 (any other guaranteed-to-exist datatype would do as * well). We can't label it with the dropped column's datatype * since that might not exist anymore. It does not really matter * what we claim the type is, since NULL is NULL --- its * representation is datatype-independent. This could perhaps * confuse code comparing the finished plan to the target * relation, however. */ Oid atttype = att_tup->atttypid; int32 atttypmod = att_tup->atttypmod; Oid attcollation = att_tup->attcollation; Node *new_expr; switch (command_type) { case CMD_INSERT: if (!att_tup->attisdropped) { new_expr = (Node *) makeConst(atttype, -1, attcollation, att_tup->attlen, (Datum) 0, true, /* isnull */ att_tup->attbyval); new_expr = coerce_to_domain(new_expr, InvalidOid, -1, atttype, COERCE_IMPLICIT_CAST, -1, false, false); } else { /* Insert NULL for dropped column */ new_expr = (Node *) makeConst(INT4OID, -1, InvalidOid, sizeof(int32), (Datum) 0, true, /* isnull */ true /* byval */ ); } break; case CMD_UPDATE: if (!att_tup->attisdropped) { new_expr = (Node *) makeVar(result_relation, attrno, atttype, atttypmod, attcollation, 0); } else { /* Insert NULL for dropped column */ new_expr = (Node *) makeConst(INT4OID, -1, InvalidOid, sizeof(int32), (Datum) 0, true, /* isnull */ true /* byval */ ); } break; default: elog(ERROR, "unrecognized command_type: %d", (int) command_type); new_expr = NULL; /* keep compiler quiet */ break; } new_tle = makeTargetEntry((Expr *) new_expr, attrno, pstrdup(NameStr(att_tup->attname)), false); } new_tlist = lappend(new_tlist, new_tle); } /* * The remaining tlist entries should be resjunk; append them all to the * end of the new tlist, making sure they have resnos higher than the last * real attribute. (Note: although the rewriter already did such * renumbering, we have to do it again here in case we are doing an UPDATE * in a table with dropped columns, or an inheritance child table with * extra columns.) */ while (tlist_item) { TargetEntry *old_tle = (TargetEntry *) lfirst(tlist_item); if (!old_tle->resjunk) elog(ERROR, "targetlist is not sorted correctly"); /* Get the resno right, but don't copy unnecessarily */ if (old_tle->resno != attrno) { old_tle = flatCopyTargetEntry(old_tle); old_tle->resno = attrno; } new_tlist = lappend(new_tlist, old_tle); attrno++; tlist_item = lnext(tlist_item); } heap_close(rel, NoLock); return new_tlist; } /* * Locate PlanRowMark for given RT index, or return NULL if none * * This probably ought to be elsewhere, but there's no very good place */ PlanRowMark * get_plan_rowmark(List *rowmarks, Index rtindex) { ListCell *l; foreach(l, rowmarks) { PlanRowMark *rc = (PlanRowMark *) lfirst(l); if (rc->rti == rtindex) return rc; } return NULL; }