mirror of
				https://github.com/postgres/postgres.git
				synced 2025-10-25 13:17:41 +03:00 
			
		
		
		
	Don't reuse slots between root and partition in ON CONFLICT ... UPDATE.
Until now the the slot to store the conflicting tuple, and the result of the ON CONFLICT SET, where reused between partitions. That necessitated changing slots descriptor when switching partitions. Besides the overhead of switching descriptors on a slot (which requires memory allocations and prevents JITing), that's importantly also problematic for tableam. There individual partitions might belong to different tableams, needing different kinds of slots. In passing also fix ExecOnConflictUpdate to clear the existing slot at exit. Otherwise that slot could continue to hold a pin till the query ends, which could be far too long if the input data set is large, and there's no further conflicts. While previously also problematic, it's now more important as there will be more such slots when partitioned. Author: Andres Freund Reviewed-By: Robert Haas, David Rowley Discussion: https://postgr.es/m/20180703070645.wchpu5muyto5n647@alap3.anarazel.de
This commit is contained in:
		| @@ -723,28 +723,55 @@ ExecInitPartitionInfo(ModifyTableState *mtstate, EState *estate, | |||||||
| 		if (node->onConflictAction == ONCONFLICT_UPDATE) | 		if (node->onConflictAction == ONCONFLICT_UPDATE) | ||||||
| 		{ | 		{ | ||||||
| 			TupleConversionMap *map; | 			TupleConversionMap *map; | ||||||
|  | 			TupleDesc	leaf_desc; | ||||||
|  |  | ||||||
| 			map = leaf_part_rri->ri_PartitionInfo->pi_RootToPartitionMap; | 			map = leaf_part_rri->ri_PartitionInfo->pi_RootToPartitionMap; | ||||||
|  | 			leaf_desc = RelationGetDescr(leaf_part_rri->ri_RelationDesc); | ||||||
|  |  | ||||||
| 			Assert(node->onConflictSet != NIL); | 			Assert(node->onConflictSet != NIL); | ||||||
| 			Assert(rootResultRelInfo->ri_onConflict != NULL); | 			Assert(rootResultRelInfo->ri_onConflict != NULL); | ||||||
|  |  | ||||||
|  | 			leaf_part_rri->ri_onConflict = makeNode(OnConflictSetState); | ||||||
|  |  | ||||||
|  | 			/* | ||||||
|  | 			 * Need a separate existing slot for each partition, as the | ||||||
|  | 			 * partition could be of a different AM, even if the tuple | ||||||
|  | 			 * descriptors match. | ||||||
|  | 			 */ | ||||||
|  | 			leaf_part_rri->ri_onConflict->oc_Existing = | ||||||
|  | 				ExecInitExtraTupleSlot(mtstate->ps.state, | ||||||
|  | 									   leaf_desc, | ||||||
|  | 									   &TTSOpsBufferHeapTuple); | ||||||
|  |  | ||||||
| 			/* | 			/* | ||||||
| 			 * If the partition's tuple descriptor matches exactly the root | 			 * If the partition's tuple descriptor matches exactly the root | ||||||
| 			 * parent (the common case), we can simply re-use the parent's ON | 			 * parent (the common case), we can re-use most of the parent's ON | ||||||
| 			 * CONFLICT SET state, skipping a bunch of work.  Otherwise, we | 			 * CONFLICT SET state, skipping a bunch of work.  Otherwise, we | ||||||
| 			 * need to create state specific to this partition. | 			 * need to create state specific to this partition. | ||||||
| 			 */ | 			 */ | ||||||
| 			if (map == NULL) | 			if (map == NULL) | ||||||
| 				leaf_part_rri->ri_onConflict = rootResultRelInfo->ri_onConflict; | 			{ | ||||||
|  | 				/* | ||||||
|  | 				 * It's safe to reuse these from the partition root, as we | ||||||
|  | 				 * only process one tuple at a time (therefore we won't | ||||||
|  | 				 * overwrite needed data in slots), and the results of | ||||||
|  | 				 * projections are independent of the underlying | ||||||
|  | 				 * storage. Projections and where clauses themselves don't | ||||||
|  | 				 * store state / are independent of the underlying storage. | ||||||
|  | 				 */ | ||||||
|  | 				leaf_part_rri->ri_onConflict->oc_ProjSlot = | ||||||
|  | 					rootResultRelInfo->ri_onConflict->oc_ProjSlot; | ||||||
|  | 				leaf_part_rri->ri_onConflict->oc_ProjInfo = | ||||||
|  | 					rootResultRelInfo->ri_onConflict->oc_ProjInfo; | ||||||
|  | 				leaf_part_rri->ri_onConflict->oc_WhereClause = | ||||||
|  | 					rootResultRelInfo->ri_onConflict->oc_WhereClause; | ||||||
|  | 			} | ||||||
| 			else | 			else | ||||||
| 			{ | 			{ | ||||||
| 				List	   *onconflset; | 				List	   *onconflset; | ||||||
| 				TupleDesc	tupDesc; | 				TupleDesc	tupDesc; | ||||||
| 				bool		found_whole_row; | 				bool		found_whole_row; | ||||||
|  |  | ||||||
| 				leaf_part_rri->ri_onConflict = makeNode(OnConflictSetState); |  | ||||||
|  |  | ||||||
| 				/* | 				/* | ||||||
| 				 * Translate expressions in onConflictSet to account for | 				 * Translate expressions in onConflictSet to account for | ||||||
| 				 * different attribute numbers.  For that, map partition | 				 * different attribute numbers.  For that, map partition | ||||||
| @@ -778,20 +805,17 @@ ExecInitPartitionInfo(ModifyTableState *mtstate, EState *estate, | |||||||
| 				/* Finally, adjust this tlist to match the partition. */ | 				/* Finally, adjust this tlist to match the partition. */ | ||||||
| 				onconflset = adjust_partition_tlist(onconflset, map); | 				onconflset = adjust_partition_tlist(onconflset, map); | ||||||
|  |  | ||||||
| 				/* | 				/* create the tuple slot for the UPDATE SET projection */ | ||||||
| 				 * Build UPDATE SET's projection info.  The user of this |  | ||||||
| 				 * projection is responsible for setting the slot's tupdesc! |  | ||||||
| 				 * We set aside a tupdesc that's good for the common case of a |  | ||||||
| 				 * partition that's tupdesc-equal to the partitioned table; |  | ||||||
| 				 * partitions of different tupdescs must generate their own. |  | ||||||
| 				 */ |  | ||||||
| 				tupDesc = ExecTypeFromTL(onconflset); | 				tupDesc = ExecTypeFromTL(onconflset); | ||||||
| 				ExecSetSlotDescriptor(mtstate->mt_conflproj, tupDesc); | 				leaf_part_rri->ri_onConflict->oc_ProjSlot = | ||||||
|  | 					ExecInitExtraTupleSlot(mtstate->ps.state, tupDesc, | ||||||
|  | 										   &TTSOpsVirtual); | ||||||
|  |  | ||||||
|  | 				/* build UPDATE SET projection state */ | ||||||
| 				leaf_part_rri->ri_onConflict->oc_ProjInfo = | 				leaf_part_rri->ri_onConflict->oc_ProjInfo = | ||||||
| 					ExecBuildProjectionInfo(onconflset, econtext, | 					ExecBuildProjectionInfo(onconflset, econtext, | ||||||
| 											mtstate->mt_conflproj, | 											leaf_part_rri->ri_onConflict->oc_ProjSlot, | ||||||
| 											&mtstate->ps, partrelDesc); | 											&mtstate->ps, partrelDesc); | ||||||
| 				leaf_part_rri->ri_onConflict->oc_ProjTupdesc = tupDesc; |  | ||||||
|  |  | ||||||
| 				/* | 				/* | ||||||
| 				 * If there is a WHERE clause, initialize state where it will | 				 * If there is a WHERE clause, initialize state where it will | ||||||
|   | |||||||
| @@ -1304,6 +1304,7 @@ ExecOnConflictUpdate(ModifyTableState *mtstate, | |||||||
| 	ExprContext *econtext = mtstate->ps.ps_ExprContext; | 	ExprContext *econtext = mtstate->ps.ps_ExprContext; | ||||||
| 	Relation	relation = resultRelInfo->ri_RelationDesc; | 	Relation	relation = resultRelInfo->ri_RelationDesc; | ||||||
| 	ExprState  *onConflictSetWhere = resultRelInfo->ri_onConflict->oc_WhereClause; | 	ExprState  *onConflictSetWhere = resultRelInfo->ri_onConflict->oc_WhereClause; | ||||||
|  | 	TupleTableSlot *existing = resultRelInfo->ri_onConflict->oc_Existing; | ||||||
| 	HeapTupleData tuple; | 	HeapTupleData tuple; | ||||||
| 	HeapUpdateFailureData hufd; | 	HeapUpdateFailureData hufd; | ||||||
| 	LockTupleMode lockmode; | 	LockTupleMode lockmode; | ||||||
| @@ -1413,7 +1414,7 @@ ExecOnConflictUpdate(ModifyTableState *mtstate, | |||||||
| 	ExecCheckHeapTupleVisible(estate, &tuple, buffer); | 	ExecCheckHeapTupleVisible(estate, &tuple, buffer); | ||||||
|  |  | ||||||
| 	/* Store target's existing tuple in the state's dedicated slot */ | 	/* Store target's existing tuple in the state's dedicated slot */ | ||||||
| 	ExecStoreBufferHeapTuple(&tuple, mtstate->mt_existing, buffer); | 	ExecStorePinnedBufferHeapTuple(&tuple, existing, buffer); | ||||||
|  |  | ||||||
| 	/* | 	/* | ||||||
| 	 * Make tuple and any needed join variables available to ExecQual and | 	 * Make tuple and any needed join variables available to ExecQual and | ||||||
| @@ -1422,13 +1423,13 @@ ExecOnConflictUpdate(ModifyTableState *mtstate, | |||||||
| 	 * has been made to reference INNER_VAR in setrefs.c, but there is no | 	 * has been made to reference INNER_VAR in setrefs.c, but there is no | ||||||
| 	 * other redirection. | 	 * other redirection. | ||||||
| 	 */ | 	 */ | ||||||
| 	econtext->ecxt_scantuple = mtstate->mt_existing; | 	econtext->ecxt_scantuple = existing; | ||||||
| 	econtext->ecxt_innertuple = excludedSlot; | 	econtext->ecxt_innertuple = excludedSlot; | ||||||
| 	econtext->ecxt_outertuple = NULL; | 	econtext->ecxt_outertuple = NULL; | ||||||
|  |  | ||||||
| 	if (!ExecQual(onConflictSetWhere, econtext)) | 	if (!ExecQual(onConflictSetWhere, econtext)) | ||||||
| 	{ | 	{ | ||||||
| 		ReleaseBuffer(buffer); | 		ExecClearTuple(existing);	/* see return below */ | ||||||
| 		InstrCountFiltered1(&mtstate->ps, 1); | 		InstrCountFiltered1(&mtstate->ps, 1); | ||||||
| 		return true;			/* done with the tuple */ | 		return true;			/* done with the tuple */ | ||||||
| 	} | 	} | ||||||
| @@ -1451,7 +1452,7 @@ ExecOnConflictUpdate(ModifyTableState *mtstate, | |||||||
| 		 * INSERT or UPDATE path. | 		 * INSERT or UPDATE path. | ||||||
| 		 */ | 		 */ | ||||||
| 		ExecWithCheckOptions(WCO_RLS_CONFLICT_CHECK, resultRelInfo, | 		ExecWithCheckOptions(WCO_RLS_CONFLICT_CHECK, resultRelInfo, | ||||||
| 							 mtstate->mt_existing, | 							 existing, | ||||||
| 							 mtstate->ps.state); | 							 mtstate->ps.state); | ||||||
| 	} | 	} | ||||||
|  |  | ||||||
| @@ -1469,11 +1470,17 @@ ExecOnConflictUpdate(ModifyTableState *mtstate, | |||||||
|  |  | ||||||
| 	/* Execute UPDATE with projection */ | 	/* Execute UPDATE with projection */ | ||||||
| 	*returning = ExecUpdate(mtstate, &tuple.t_self, NULL, | 	*returning = ExecUpdate(mtstate, &tuple.t_self, NULL, | ||||||
| 							mtstate->mt_conflproj, planSlot, | 							resultRelInfo->ri_onConflict->oc_ProjSlot, | ||||||
|  | 							planSlot, | ||||||
| 							&mtstate->mt_epqstate, mtstate->ps.state, | 							&mtstate->mt_epqstate, mtstate->ps.state, | ||||||
| 							canSetTag); | 							canSetTag); | ||||||
|  |  | ||||||
| 	ReleaseBuffer(buffer); | 	/* | ||||||
|  | 	 * Clear out existing tuple, as there might not be another conflict among | ||||||
|  | 	 * the next input rows. Don't want to hold resources till the end of the | ||||||
|  | 	 * query. | ||||||
|  | 	 */ | ||||||
|  | 	ExecClearTuple(existing); | ||||||
| 	return true; | 	return true; | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -1633,7 +1640,6 @@ ExecPrepareTupleRouting(ModifyTableState *mtstate, | |||||||
| 						ResultRelInfo *targetRelInfo, | 						ResultRelInfo *targetRelInfo, | ||||||
| 						TupleTableSlot *slot) | 						TupleTableSlot *slot) | ||||||
| { | { | ||||||
| 	ModifyTable *node; |  | ||||||
| 	ResultRelInfo *partrel; | 	ResultRelInfo *partrel; | ||||||
| 	PartitionRoutingInfo *partrouteinfo; | 	PartitionRoutingInfo *partrouteinfo; | ||||||
| 	TupleConversionMap *map; | 	TupleConversionMap *map; | ||||||
| @@ -1698,19 +1704,6 @@ ExecPrepareTupleRouting(ModifyTableState *mtstate, | |||||||
| 		slot = execute_attr_map_slot(map->attrMap, slot, new_slot); | 		slot = execute_attr_map_slot(map->attrMap, slot, new_slot); | ||||||
| 	} | 	} | ||||||
|  |  | ||||||
| 	/* Initialize information needed to handle ON CONFLICT DO UPDATE. */ |  | ||||||
| 	Assert(mtstate != NULL); |  | ||||||
| 	node = (ModifyTable *) mtstate->ps.plan; |  | ||||||
| 	if (node->onConflictAction == ONCONFLICT_UPDATE) |  | ||||||
| 	{ |  | ||||||
| 		Assert(mtstate->mt_existing != NULL); |  | ||||||
| 		ExecSetSlotDescriptor(mtstate->mt_existing, |  | ||||||
| 							  RelationGetDescr(partrel->ri_RelationDesc)); |  | ||||||
| 		Assert(mtstate->mt_conflproj != NULL); |  | ||||||
| 		ExecSetSlotDescriptor(mtstate->mt_conflproj, |  | ||||||
| 							  partrel->ri_onConflict->oc_ProjTupdesc); |  | ||||||
| 	} |  | ||||||
|  |  | ||||||
| 	return slot; | 	return slot; | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -2319,43 +2312,28 @@ ExecInitModifyTable(ModifyTable *node, EState *estate, int eflags) | |||||||
| 		econtext = mtstate->ps.ps_ExprContext; | 		econtext = mtstate->ps.ps_ExprContext; | ||||||
| 		relationDesc = resultRelInfo->ri_RelationDesc->rd_att; | 		relationDesc = resultRelInfo->ri_RelationDesc->rd_att; | ||||||
|  |  | ||||||
| 		/* |  | ||||||
| 		 * Initialize slot for the existing tuple.  If we'll be performing |  | ||||||
| 		 * tuple routing, the tuple descriptor to use for this will be |  | ||||||
| 		 * determined based on which relation the update is actually applied |  | ||||||
| 		 * to, so we don't set its tuple descriptor here. |  | ||||||
| 		 */ |  | ||||||
| 		mtstate->mt_existing = |  | ||||||
| 			ExecInitExtraTupleSlot(mtstate->ps.state, |  | ||||||
| 								   mtstate->mt_partition_tuple_routing ? |  | ||||||
| 								   NULL : relationDesc, &TTSOpsBufferHeapTuple); |  | ||||||
|  |  | ||||||
| 		/* carried forward solely for the benefit of explain */ | 		/* carried forward solely for the benefit of explain */ | ||||||
| 		mtstate->mt_excludedtlist = node->exclRelTlist; | 		mtstate->mt_excludedtlist = node->exclRelTlist; | ||||||
|  |  | ||||||
| 		/* create state for DO UPDATE SET operation */ | 		/* create state for DO UPDATE SET operation */ | ||||||
| 		resultRelInfo->ri_onConflict = makeNode(OnConflictSetState); | 		resultRelInfo->ri_onConflict = makeNode(OnConflictSetState); | ||||||
|  |  | ||||||
| 		/* | 		/* initialize slot for the existing tuple */ | ||||||
| 		 * Create the tuple slot for the UPDATE SET projection. | 		resultRelInfo->ri_onConflict->oc_Existing = | ||||||
| 		 * | 			ExecInitExtraTupleSlot(mtstate->ps.state, relationDesc, | ||||||
| 		 * Just like mt_existing above, we leave it without a tuple descriptor | 								   &TTSOpsBufferHeapTuple); | ||||||
| 		 * in the case of partitioning tuple routing, so that it can be |  | ||||||
| 		 * changed by ExecPrepareTupleRouting.  In that case, we still save | 		/* create the tuple slot for the UPDATE SET projection */ | ||||||
| 		 * the tupdesc in the parent's state: it can be reused by partitions |  | ||||||
| 		 * with an identical descriptor to the parent. |  | ||||||
| 		 */ |  | ||||||
| 		tupDesc = ExecTypeFromTL((List *) node->onConflictSet); | 		tupDesc = ExecTypeFromTL((List *) node->onConflictSet); | ||||||
| 		mtstate->mt_conflproj = | 		resultRelInfo->ri_onConflict->oc_ProjSlot = | ||||||
| 			ExecInitExtraTupleSlot(mtstate->ps.state, | 			ExecInitExtraTupleSlot(mtstate->ps.state, tupDesc, | ||||||
| 								   mtstate->mt_partition_tuple_routing ? | 								   &TTSOpsVirtual); | ||||||
| 								   NULL : tupDesc, &TTSOpsHeapTuple); |  | ||||||
| 		resultRelInfo->ri_onConflict->oc_ProjTupdesc = tupDesc; |  | ||||||
|  |  | ||||||
| 		/* build UPDATE SET projection state */ | 		/* build UPDATE SET projection state */ | ||||||
| 		resultRelInfo->ri_onConflict->oc_ProjInfo = | 		resultRelInfo->ri_onConflict->oc_ProjInfo = | ||||||
| 			ExecBuildProjectionInfo(node->onConflictSet, econtext, | 			ExecBuildProjectionInfo(node->onConflictSet, econtext, | ||||||
| 									mtstate->mt_conflproj, &mtstate->ps, | 									resultRelInfo->ri_onConflict->oc_ProjSlot, | ||||||
|  | 									&mtstate->ps, | ||||||
| 									relationDesc); | 									relationDesc); | ||||||
|  |  | ||||||
| 		/* initialize state to evaluate the WHERE clause, if any */ | 		/* initialize state to evaluate the WHERE clause, if any */ | ||||||
|   | |||||||
| @@ -377,8 +377,9 @@ typedef struct OnConflictSetState | |||||||
| { | { | ||||||
| 	NodeTag		type; | 	NodeTag		type; | ||||||
|  |  | ||||||
|  | 	TupleTableSlot *oc_Existing;	/* slot to store existing target tuple in */ | ||||||
|  | 	TupleTableSlot *oc_ProjSlot;	/* CONFLICT ... SET ... projection target */ | ||||||
| 	ProjectionInfo *oc_ProjInfo;	/* for ON CONFLICT DO UPDATE SET */ | 	ProjectionInfo *oc_ProjInfo;	/* for ON CONFLICT DO UPDATE SET */ | ||||||
| 	TupleDesc	oc_ProjTupdesc; /* TupleDesc for the above projection */ |  | ||||||
| 	ExprState  *oc_WhereClause; /* state for the WHERE clause */ | 	ExprState  *oc_WhereClause; /* state for the WHERE clause */ | ||||||
| } OnConflictSetState; | } OnConflictSetState; | ||||||
|  |  | ||||||
| @@ -1109,9 +1110,7 @@ typedef struct ModifyTableState | |||||||
| 	List	  **mt_arowmarks;	/* per-subplan ExecAuxRowMark lists */ | 	List	  **mt_arowmarks;	/* per-subplan ExecAuxRowMark lists */ | ||||||
| 	EPQState	mt_epqstate;	/* for evaluating EvalPlanQual rechecks */ | 	EPQState	mt_epqstate;	/* for evaluating EvalPlanQual rechecks */ | ||||||
| 	bool		fireBSTriggers; /* do we need to fire stmt triggers? */ | 	bool		fireBSTriggers; /* do we need to fire stmt triggers? */ | ||||||
| 	TupleTableSlot *mt_existing;	/* slot to store existing target tuple in */ |  | ||||||
| 	List	   *mt_excludedtlist;	/* the excluded pseudo relation's tlist  */ | 	List	   *mt_excludedtlist;	/* the excluded pseudo relation's tlist  */ | ||||||
| 	TupleTableSlot *mt_conflproj;	/* CONFLICT ... SET ... projection target */ |  | ||||||
|  |  | ||||||
| 	/* | 	/* | ||||||
| 	 * Slot for storing tuples in the root partitioned table's rowtype during | 	 * Slot for storing tuples in the root partitioned table's rowtype during | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user