mirror of
				https://github.com/postgres/postgres.git
				synced 2025-10-25 13:17:41 +03:00 
			
		
		
		
	Collect JIT instrumentation from workers.
Previously, when using parallel query, EXPLAIN (ANALYZE)'s JIT compilation timings did not include the overhead from doing so on the workers. Fix that. We do so by simply aggregating the cost of doing JIT compilation on workers and the leader together. Arguably that's not quite accurate, because the total time spend doing so is spent in parallel - but it's hard to do much better. For additional detail, when VERBOSE is specified, the stats for workers are displayed separately. Author: Amit Khandekar and Andres Freund Discussion: https://postgr.es/m/CAJ3gD9eLrz51RK_gTkod+71iDcjpB_N8eC6vU2AW-VicsAERpQ@mail.gmail.com Backpatch: 11-
This commit is contained in:
		| @@ -362,9 +362,9 @@ explain_ExecutorEnd(QueryDesc *queryDesc) | |||||||
| 			ExplainPrintPlan(es, queryDesc); | 			ExplainPrintPlan(es, queryDesc); | ||||||
| 			if (es->analyze && auto_explain_log_triggers) | 			if (es->analyze && auto_explain_log_triggers) | ||||||
| 				ExplainPrintTriggers(es, queryDesc); | 				ExplainPrintTriggers(es, queryDesc); | ||||||
| 			if (queryDesc->estate->es_jit && es->costs && | 			if (es->costs) | ||||||
| 				queryDesc->estate->es_jit->created_functions > 0) | 				ExplainPrintJIT(es, queryDesc->estate->es_jit_flags, | ||||||
| 				ExplainPrintJIT(es, queryDesc); | 								queryDesc->estate->es_jit_combined_instr, -1); | ||||||
| 			ExplainEndOutput(es); | 			ExplainEndOutput(es); | ||||||
|  |  | ||||||
| 			/* Remove last line break */ | 			/* Remove last line break */ | ||||||
|   | |||||||
| @@ -563,9 +563,9 @@ ExplainOnePlan(PlannedStmt *plannedstmt, IntoClause *into, ExplainState *es, | |||||||
| 	 * depending on build options.  Might want to separate that out from COSTS | 	 * depending on build options.  Might want to separate that out from COSTS | ||||||
| 	 * at a later stage. | 	 * at a later stage. | ||||||
| 	 */ | 	 */ | ||||||
| 	if (queryDesc->estate->es_jit && es->costs && | 	if (es->costs) | ||||||
| 		queryDesc->estate->es_jit->created_functions > 0) | 		ExplainPrintJIT(es, queryDesc->estate->es_jit_flags, | ||||||
| 		ExplainPrintJIT(es, queryDesc); | 						queryDesc->estate->es_jit_combined_instr, -1); | ||||||
|  |  | ||||||
| 	/* | 	/* | ||||||
| 	 * Close down the query and free resources.  Include time for this in the | 	 * Close down the query and free resources.  Include time for this in the | ||||||
| @@ -691,19 +691,27 @@ ExplainPrintTriggers(ExplainState *es, QueryDesc *queryDesc) | |||||||
| /* | /* | ||||||
|  * ExplainPrintJIT - |  * ExplainPrintJIT - | ||||||
|  *	  Append information about JITing to es->str. |  *	  Append information about JITing to es->str. | ||||||
|  |  * | ||||||
|  |  * Can be used to print the JIT instrumentation of the backend (worker_num = | ||||||
|  |  * -1) or that of a specific worker (worker_num = ...). | ||||||
|  */ |  */ | ||||||
| void | void | ||||||
| ExplainPrintJIT(ExplainState *es, QueryDesc *queryDesc) | ExplainPrintJIT(ExplainState *es, int jit_flags, | ||||||
|  | 				JitInstrumentation *ji, int worker_num) | ||||||
| { | { | ||||||
| 	JitContext *jc = queryDesc->estate->es_jit; |  | ||||||
| 	instr_time	total_time; | 	instr_time	total_time; | ||||||
|  | 	bool		for_workers = (worker_num >= 0); | ||||||
|  |  | ||||||
|  | 	/* don't print information if no JITing happened */ | ||||||
|  | 	if (!ji || ji->created_functions == 0) | ||||||
|  | 		return; | ||||||
|  |  | ||||||
| 	/* calculate total time */ | 	/* calculate total time */ | ||||||
| 	INSTR_TIME_SET_ZERO(total_time); | 	INSTR_TIME_SET_ZERO(total_time); | ||||||
| 	INSTR_TIME_ADD(total_time, jc->generation_counter); | 	INSTR_TIME_ADD(total_time, ji->generation_counter); | ||||||
| 	INSTR_TIME_ADD(total_time, jc->inlining_counter); | 	INSTR_TIME_ADD(total_time, ji->inlining_counter); | ||||||
| 	INSTR_TIME_ADD(total_time, jc->optimization_counter); | 	INSTR_TIME_ADD(total_time, ji->optimization_counter); | ||||||
| 	INSTR_TIME_ADD(total_time, jc->emission_counter); | 	INSTR_TIME_ADD(total_time, ji->emission_counter); | ||||||
|  |  | ||||||
| 	ExplainOpenGroup("JIT", "JIT", true, es); | 	ExplainOpenGroup("JIT", "JIT", true, es); | ||||||
|  |  | ||||||
| @@ -711,27 +719,30 @@ ExplainPrintJIT(ExplainState *es, QueryDesc *queryDesc) | |||||||
| 	if (es->format == EXPLAIN_FORMAT_TEXT) | 	if (es->format == EXPLAIN_FORMAT_TEXT) | ||||||
| 	{ | 	{ | ||||||
| 		appendStringInfoSpaces(es->str, es->indent * 2); | 		appendStringInfoSpaces(es->str, es->indent * 2); | ||||||
|  | 		if (for_workers) | ||||||
|  | 			appendStringInfo(es->str, "JIT for worker %u:\n", worker_num); | ||||||
|  | 		else | ||||||
| 			appendStringInfo(es->str, "JIT:\n"); | 			appendStringInfo(es->str, "JIT:\n"); | ||||||
| 		es->indent += 1; | 		es->indent += 1; | ||||||
|  |  | ||||||
| 		ExplainPropertyInteger("Functions", NULL, jc->created_functions, es); | 		ExplainPropertyInteger("Functions", NULL, ji->created_functions, es); | ||||||
|  |  | ||||||
| 		appendStringInfoSpaces(es->str, es->indent * 2); | 		appendStringInfoSpaces(es->str, es->indent * 2); | ||||||
| 		appendStringInfo(es->str, "Options: %s %s, %s %s, %s %s, %s %s\n", | 		appendStringInfo(es->str, "Options: %s %s, %s %s, %s %s, %s %s\n", | ||||||
| 						 "Inlining", jc->flags & PGJIT_INLINE ? "true" : "false", | 						 "Inlining", jit_flags & PGJIT_INLINE ? "true" : "false", | ||||||
| 						 "Optimization", jc->flags & PGJIT_OPT3 ? "true" : "false", | 						 "Optimization", jit_flags & PGJIT_OPT3 ? "true" : "false", | ||||||
| 						 "Expressions", jc->flags & PGJIT_EXPR ? "true" : "false", | 						 "Expressions", jit_flags & PGJIT_EXPR ? "true" : "false", | ||||||
| 						 "Deforming", jc->flags & PGJIT_DEFORM ? "true" : "false"); | 						 "Deforming", jit_flags & PGJIT_DEFORM ? "true" : "false"); | ||||||
|  |  | ||||||
| 		if (es->analyze && es->timing) | 		if (es->analyze && es->timing) | ||||||
| 		{ | 		{ | ||||||
| 			appendStringInfoSpaces(es->str, es->indent * 2); | 			appendStringInfoSpaces(es->str, es->indent * 2); | ||||||
| 			appendStringInfo(es->str, | 			appendStringInfo(es->str, | ||||||
| 							 "Timing: %s %.3f ms, %s %.3f ms, %s %.3f ms, %s %.3f ms, %s %.3f ms\n", | 							 "Timing: %s %.3f ms, %s %.3f ms, %s %.3f ms, %s %.3f ms, %s %.3f ms\n", | ||||||
| 							 "Generation", 1000.0 * INSTR_TIME_GET_DOUBLE(jc->generation_counter), | 							 "Generation", 1000.0 * INSTR_TIME_GET_DOUBLE(ji->generation_counter), | ||||||
| 							 "Inlining", 1000.0 * INSTR_TIME_GET_DOUBLE(jc->inlining_counter), | 							 "Inlining", 1000.0 * INSTR_TIME_GET_DOUBLE(ji->inlining_counter), | ||||||
| 							 "Optimization", 1000.0 * INSTR_TIME_GET_DOUBLE(jc->optimization_counter), | 							 "Optimization", 1000.0 * INSTR_TIME_GET_DOUBLE(ji->optimization_counter), | ||||||
| 							 "Emission", 1000.0 * INSTR_TIME_GET_DOUBLE(jc->emission_counter), | 							 "Emission", 1000.0 * INSTR_TIME_GET_DOUBLE(ji->emission_counter), | ||||||
| 							 "Total", 1000.0 * INSTR_TIME_GET_DOUBLE(total_time)); | 							 "Total", 1000.0 * INSTR_TIME_GET_DOUBLE(total_time)); | ||||||
| 		} | 		} | ||||||
|  |  | ||||||
| @@ -739,13 +750,14 @@ ExplainPrintJIT(ExplainState *es, QueryDesc *queryDesc) | |||||||
| 	} | 	} | ||||||
| 	else | 	else | ||||||
| 	{ | 	{ | ||||||
| 		ExplainPropertyInteger("Functions", NULL, jc->created_functions, es); | 		ExplainPropertyInteger("Worker Number", NULL, worker_num, es); | ||||||
|  | 		ExplainPropertyInteger("Functions", NULL, ji->created_functions, es); | ||||||
|  |  | ||||||
| 		ExplainOpenGroup("Options", "Options", true, es); | 		ExplainOpenGroup("Options", "Options", true, es); | ||||||
| 		ExplainPropertyBool("Inlining", jc->flags & PGJIT_INLINE, es); | 		ExplainPropertyBool("Inlining", jit_flags & PGJIT_INLINE, es); | ||||||
| 		ExplainPropertyBool("Optimization", jc->flags & PGJIT_OPT3, es); | 		ExplainPropertyBool("Optimization", jit_flags & PGJIT_OPT3, es); | ||||||
| 		ExplainPropertyBool("Expressions", jc->flags & PGJIT_EXPR, es); | 		ExplainPropertyBool("Expressions", jit_flags & PGJIT_EXPR, es); | ||||||
| 		ExplainPropertyBool("Deforming", jc->flags & PGJIT_DEFORM, es); | 		ExplainPropertyBool("Deforming", jit_flags & PGJIT_DEFORM, es); | ||||||
| 		ExplainCloseGroup("Options", "Options", true, es); | 		ExplainCloseGroup("Options", "Options", true, es); | ||||||
|  |  | ||||||
| 		if (es->analyze && es->timing) | 		if (es->analyze && es->timing) | ||||||
| @@ -753,16 +765,16 @@ ExplainPrintJIT(ExplainState *es, QueryDesc *queryDesc) | |||||||
| 			ExplainOpenGroup("Timing", "Timing", true, es); | 			ExplainOpenGroup("Timing", "Timing", true, es); | ||||||
|  |  | ||||||
| 			ExplainPropertyFloat("Generation", "ms", | 			ExplainPropertyFloat("Generation", "ms", | ||||||
| 								 1000.0 * INSTR_TIME_GET_DOUBLE(jc->generation_counter), | 								 1000.0 * INSTR_TIME_GET_DOUBLE(ji->generation_counter), | ||||||
| 								 3, es); | 								 3, es); | ||||||
| 			ExplainPropertyFloat("Inlining", "ms", | 			ExplainPropertyFloat("Inlining", "ms", | ||||||
| 								 1000.0 * INSTR_TIME_GET_DOUBLE(jc->inlining_counter), | 								 1000.0 * INSTR_TIME_GET_DOUBLE(ji->inlining_counter), | ||||||
| 								 3, es); | 								 3, es); | ||||||
| 			ExplainPropertyFloat("Optimization", "ms", | 			ExplainPropertyFloat("Optimization", "ms", | ||||||
| 								 1000.0 * INSTR_TIME_GET_DOUBLE(jc->optimization_counter), | 								 1000.0 * INSTR_TIME_GET_DOUBLE(ji->optimization_counter), | ||||||
| 								 3, es); | 								 3, es); | ||||||
| 			ExplainPropertyFloat("Emission", "ms", | 			ExplainPropertyFloat("Emission", "ms", | ||||||
| 								 1000.0 * INSTR_TIME_GET_DOUBLE(jc->emission_counter), | 								 1000.0 * INSTR_TIME_GET_DOUBLE(ji->emission_counter), | ||||||
| 								 3, es); | 								 3, es); | ||||||
| 			ExplainPropertyFloat("Total", "ms", | 			ExplainPropertyFloat("Total", "ms", | ||||||
| 								 1000.0 * INSTR_TIME_GET_DOUBLE(total_time), | 								 1000.0 * INSTR_TIME_GET_DOUBLE(total_time), | ||||||
| @@ -1554,6 +1566,25 @@ ExplainNode(PlanState *planstate, List *ancestors, | |||||||
| 					ExplainPropertyInteger("Workers Launched", NULL, | 					ExplainPropertyInteger("Workers Launched", NULL, | ||||||
| 										   nworkers, es); | 										   nworkers, es); | ||||||
| 				} | 				} | ||||||
|  |  | ||||||
|  | 				/* | ||||||
|  | 				 * Print per-worker Jit instrumentation. Use same conditions | ||||||
|  | 				 * as for the leader's JIT instrumentation, see comment there. | ||||||
|  | 				 */ | ||||||
|  | 				if (es->costs && es->verbose && | ||||||
|  | 					outerPlanState(planstate)->worker_jit_instrument) | ||||||
|  | 				{ | ||||||
|  | 					PlanState *child = outerPlanState(planstate); | ||||||
|  | 					int			n; | ||||||
|  | 					SharedJitInstrumentation *w = child->worker_jit_instrument; | ||||||
|  |  | ||||||
|  | 					for (n = 0; n < w->num_workers; ++n) | ||||||
|  | 					{ | ||||||
|  | 						ExplainPrintJIT(es, child->state->es_jit_flags, | ||||||
|  | 										&w->jit_instr[n], n); | ||||||
|  | 					} | ||||||
|  | 				} | ||||||
|  |  | ||||||
| 				if (gather->single_copy || es->format != EXPLAIN_FORMAT_TEXT) | 				if (gather->single_copy || es->format != EXPLAIN_FORMAT_TEXT) | ||||||
| 					ExplainPropertyBool("Single Copy", gather->single_copy, es); | 					ExplainPropertyBool("Single Copy", gather->single_copy, es); | ||||||
| 			} | 			} | ||||||
|   | |||||||
| @@ -48,6 +48,7 @@ | |||||||
| #include "executor/execdebug.h" | #include "executor/execdebug.h" | ||||||
| #include "executor/nodeSubplan.h" | #include "executor/nodeSubplan.h" | ||||||
| #include "foreign/fdwapi.h" | #include "foreign/fdwapi.h" | ||||||
|  | #include "jit/jit.h" | ||||||
| #include "mb/pg_wchar.h" | #include "mb/pg_wchar.h" | ||||||
| #include "miscadmin.h" | #include "miscadmin.h" | ||||||
| #include "optimizer/clauses.h" | #include "optimizer/clauses.h" | ||||||
| @@ -494,6 +495,21 @@ standard_ExecutorEnd(QueryDesc *queryDesc) | |||||||
|  |  | ||||||
| 	ExecEndPlan(queryDesc->planstate, estate); | 	ExecEndPlan(queryDesc->planstate, estate); | ||||||
|  |  | ||||||
|  | 	/* | ||||||
|  | 	 * If this process has done JIT, either merge stats into worker stats, or | ||||||
|  | 	 * use this process' stats as the global stats if no parallelism was used | ||||||
|  | 	 * / no workers did JIT. | ||||||
|  | 	 */ | ||||||
|  | 	if (estate->es_instrument && queryDesc->estate->es_jit) | ||||||
|  | 	{ | ||||||
|  | 		if (queryDesc->estate->es_jit_combined_instr) | ||||||
|  | 			InstrJitAgg(queryDesc->estate->es_jit_combined_instr, | ||||||
|  | 						&queryDesc->estate->es_jit->instr); | ||||||
|  | 		else | ||||||
|  | 			queryDesc->estate->es_jit_combined_instr = | ||||||
|  | 				&queryDesc->estate->es_jit->instr; | ||||||
|  | 	} | ||||||
|  |  | ||||||
| 	/* do away with our snapshots */ | 	/* do away with our snapshots */ | ||||||
| 	UnregisterSnapshot(estate->es_snapshot); | 	UnregisterSnapshot(estate->es_snapshot); | ||||||
| 	UnregisterSnapshot(estate->es_crosscheck_snapshot); | 	UnregisterSnapshot(estate->es_crosscheck_snapshot); | ||||||
|   | |||||||
| @@ -37,6 +37,7 @@ | |||||||
| #include "executor/nodeSort.h" | #include "executor/nodeSort.h" | ||||||
| #include "executor/nodeSubplan.h" | #include "executor/nodeSubplan.h" | ||||||
| #include "executor/tqueue.h" | #include "executor/tqueue.h" | ||||||
|  | #include "jit/jit.h" | ||||||
| #include "nodes/nodeFuncs.h" | #include "nodes/nodeFuncs.h" | ||||||
| #include "optimizer/planmain.h" | #include "optimizer/planmain.h" | ||||||
| #include "optimizer/planner.h" | #include "optimizer/planner.h" | ||||||
| @@ -62,6 +63,7 @@ | |||||||
| #define PARALLEL_KEY_INSTRUMENTATION	UINT64CONST(0xE000000000000006) | #define PARALLEL_KEY_INSTRUMENTATION	UINT64CONST(0xE000000000000006) | ||||||
| #define PARALLEL_KEY_DSA				UINT64CONST(0xE000000000000007) | #define PARALLEL_KEY_DSA				UINT64CONST(0xE000000000000007) | ||||||
| #define PARALLEL_KEY_QUERY_TEXT		UINT64CONST(0xE000000000000008) | #define PARALLEL_KEY_QUERY_TEXT		UINT64CONST(0xE000000000000008) | ||||||
|  | #define PARALLEL_KEY_JIT_INSTRUMENTATION UINT64CONST(0xE000000000000009) | ||||||
|  |  | ||||||
| #define PARALLEL_TUPLE_QUEUE_SIZE		65536 | #define PARALLEL_TUPLE_QUEUE_SIZE		65536 | ||||||
|  |  | ||||||
| @@ -573,9 +575,11 @@ ExecInitParallelPlan(PlanState *planstate, EState *estate, | |||||||
| 	char	   *paramlistinfo_space; | 	char	   *paramlistinfo_space; | ||||||
| 	BufferUsage *bufusage_space; | 	BufferUsage *bufusage_space; | ||||||
| 	SharedExecutorInstrumentation *instrumentation = NULL; | 	SharedExecutorInstrumentation *instrumentation = NULL; | ||||||
|  | 	SharedJitInstrumentation *jit_instrumentation = NULL; | ||||||
| 	int			pstmt_len; | 	int			pstmt_len; | ||||||
| 	int			paramlistinfo_len; | 	int			paramlistinfo_len; | ||||||
| 	int			instrumentation_len = 0; | 	int			instrumentation_len = 0; | ||||||
|  | 	int			jit_instrumentation_len = 0; | ||||||
| 	int			instrument_offset = 0; | 	int			instrument_offset = 0; | ||||||
| 	Size		dsa_minsize = dsa_minimum_size(); | 	Size		dsa_minsize = dsa_minimum_size(); | ||||||
| 	char	   *query_string; | 	char	   *query_string; | ||||||
| @@ -669,6 +673,16 @@ ExecInitParallelPlan(PlanState *planstate, EState *estate, | |||||||
| 					 mul_size(e.nnodes, nworkers)); | 					 mul_size(e.nnodes, nworkers)); | ||||||
| 		shm_toc_estimate_chunk(&pcxt->estimator, instrumentation_len); | 		shm_toc_estimate_chunk(&pcxt->estimator, instrumentation_len); | ||||||
| 		shm_toc_estimate_keys(&pcxt->estimator, 1); | 		shm_toc_estimate_keys(&pcxt->estimator, 1); | ||||||
|  |  | ||||||
|  | 		/* Estimate space for JIT instrumentation, if required. */ | ||||||
|  | 		if (estate->es_jit_flags != PGJIT_NONE) | ||||||
|  | 		{ | ||||||
|  | 			jit_instrumentation_len = | ||||||
|  | 				offsetof(SharedJitInstrumentation, jit_instr) + | ||||||
|  | 				sizeof(JitInstrumentation) * nworkers; | ||||||
|  | 			shm_toc_estimate_chunk(&pcxt->estimator, jit_instrumentation_len); | ||||||
|  | 			shm_toc_estimate_keys(&pcxt->estimator, 1); | ||||||
|  | 		} | ||||||
| 	} | 	} | ||||||
|  |  | ||||||
| 	/* Estimate space for DSA area. */ | 	/* Estimate space for DSA area. */ | ||||||
| @@ -742,6 +756,18 @@ ExecInitParallelPlan(PlanState *planstate, EState *estate, | |||||||
| 		shm_toc_insert(pcxt->toc, PARALLEL_KEY_INSTRUMENTATION, | 		shm_toc_insert(pcxt->toc, PARALLEL_KEY_INSTRUMENTATION, | ||||||
| 					   instrumentation); | 					   instrumentation); | ||||||
| 		pei->instrumentation = instrumentation; | 		pei->instrumentation = instrumentation; | ||||||
|  |  | ||||||
|  | 		if (estate->es_jit_flags != PGJIT_NONE) | ||||||
|  | 		{ | ||||||
|  | 			jit_instrumentation = shm_toc_allocate(pcxt->toc, | ||||||
|  | 												   jit_instrumentation_len); | ||||||
|  | 			jit_instrumentation->num_workers = nworkers; | ||||||
|  | 			memset(jit_instrumentation->jit_instr, 0, | ||||||
|  | 				   sizeof(JitInstrumentation) * nworkers); | ||||||
|  | 			shm_toc_insert(pcxt->toc, PARALLEL_KEY_JIT_INSTRUMENTATION, | ||||||
|  | 						   jit_instrumentation); | ||||||
|  | 			pei->jit_instrumentation = jit_instrumentation; | ||||||
|  | 		} | ||||||
| 	} | 	} | ||||||
|  |  | ||||||
| 	/* | 	/* | ||||||
| @@ -1003,6 +1029,46 @@ ExecParallelRetrieveInstrumentation(PlanState *planstate, | |||||||
| 								 instrumentation); | 								 instrumentation); | ||||||
| } | } | ||||||
|  |  | ||||||
|  | /* | ||||||
|  |  * Add up the workers' JIT instrumentation from dynamic shared memory. | ||||||
|  |  */ | ||||||
|  | static void | ||||||
|  | ExecParallelRetrieveJitInstrumentation(PlanState *planstate, | ||||||
|  | 									   SharedJitInstrumentation *shared_jit) | ||||||
|  | { | ||||||
|  | 	JitInstrumentation *combined; | ||||||
|  | 	int			ibytes; | ||||||
|  |  | ||||||
|  | 	int			n; | ||||||
|  |  | ||||||
|  | 	/* | ||||||
|  | 	 * Accumulate worker JIT instrumentation into the combined JIT | ||||||
|  | 	 * instrumentation, allocating it if required. Note this is kept separate | ||||||
|  | 	 * from the leader's own instrumentation. | ||||||
|  | 	 */ | ||||||
|  | 	if (!planstate->state->es_jit_combined_instr) | ||||||
|  | 		planstate->state->es_jit_combined_instr = | ||||||
|  | 			MemoryContextAllocZero(planstate->state->es_query_cxt, sizeof(JitInstrumentation)); | ||||||
|  | 	combined = planstate->state->es_jit_combined_instr; | ||||||
|  |  | ||||||
|  | 	/* Accummulate all the workers' instrumentations. */ | ||||||
|  | 	for (n = 0; n < shared_jit->num_workers; ++n) | ||||||
|  | 		InstrJitAgg(combined, &shared_jit->jit_instr[n]); | ||||||
|  |  | ||||||
|  | 	/* | ||||||
|  | 	 * Store the per-worker detail. | ||||||
|  | 	 * | ||||||
|  | 	 * Similar to ExecParallelRetrieveInstrumentation(), allocate the | ||||||
|  | 	 * instrumentation in per-query context. | ||||||
|  | 	 */ | ||||||
|  | 	ibytes = offsetof(SharedJitInstrumentation, jit_instr) | ||||||
|  | 			 + mul_size(shared_jit->num_workers, sizeof(JitInstrumentation)); | ||||||
|  | 	planstate->worker_jit_instrument = | ||||||
|  | 		MemoryContextAlloc(planstate->state->es_query_cxt, ibytes); | ||||||
|  |  | ||||||
|  | 	memcpy(planstate->worker_jit_instrument, shared_jit, ibytes); | ||||||
|  | } | ||||||
|  |  | ||||||
| /* | /* | ||||||
|  * Finish parallel execution.  We wait for parallel workers to finish, and |  * Finish parallel execution.  We wait for parallel workers to finish, and | ||||||
|  * accumulate their buffer usage. |  * accumulate their buffer usage. | ||||||
| @@ -1068,6 +1134,11 @@ ExecParallelCleanup(ParallelExecutorInfo *pei) | |||||||
| 		ExecParallelRetrieveInstrumentation(pei->planstate, | 		ExecParallelRetrieveInstrumentation(pei->planstate, | ||||||
| 											pei->instrumentation); | 											pei->instrumentation); | ||||||
|  |  | ||||||
|  | 	/* Accumulate JIT instrumentation, if any. */ | ||||||
|  | 	if (pei->jit_instrumentation) | ||||||
|  | 		ExecParallelRetrieveJitInstrumentation(pei->planstate, | ||||||
|  | 											pei->jit_instrumentation); | ||||||
|  |  | ||||||
| 	/* Free any serialized parameters. */ | 	/* Free any serialized parameters. */ | ||||||
| 	if (DsaPointerIsValid(pei->param_exec)) | 	if (DsaPointerIsValid(pei->param_exec)) | ||||||
| 	{ | 	{ | ||||||
| @@ -1274,6 +1345,7 @@ ParallelQueryMain(dsm_segment *seg, shm_toc *toc) | |||||||
| 	DestReceiver *receiver; | 	DestReceiver *receiver; | ||||||
| 	QueryDesc  *queryDesc; | 	QueryDesc  *queryDesc; | ||||||
| 	SharedExecutorInstrumentation *instrumentation; | 	SharedExecutorInstrumentation *instrumentation; | ||||||
|  | 	SharedJitInstrumentation *jit_instrumentation; | ||||||
| 	int			instrument_options = 0; | 	int			instrument_options = 0; | ||||||
| 	void	   *area_space; | 	void	   *area_space; | ||||||
| 	dsa_area   *area; | 	dsa_area   *area; | ||||||
| @@ -1287,6 +1359,8 @@ ParallelQueryMain(dsm_segment *seg, shm_toc *toc) | |||||||
| 	instrumentation = shm_toc_lookup(toc, PARALLEL_KEY_INSTRUMENTATION, true); | 	instrumentation = shm_toc_lookup(toc, PARALLEL_KEY_INSTRUMENTATION, true); | ||||||
| 	if (instrumentation != NULL) | 	if (instrumentation != NULL) | ||||||
| 		instrument_options = instrumentation->instrument_options; | 		instrument_options = instrumentation->instrument_options; | ||||||
|  | 	jit_instrumentation = shm_toc_lookup(toc, PARALLEL_KEY_JIT_INSTRUMENTATION, | ||||||
|  | 										 true); | ||||||
| 	queryDesc = ExecParallelGetQueryDesc(toc, receiver, instrument_options); | 	queryDesc = ExecParallelGetQueryDesc(toc, receiver, instrument_options); | ||||||
|  |  | ||||||
| 	/* Setting debug_query_string for individual workers */ | 	/* Setting debug_query_string for individual workers */ | ||||||
| @@ -1350,6 +1424,14 @@ ParallelQueryMain(dsm_segment *seg, shm_toc *toc) | |||||||
| 		ExecParallelReportInstrumentation(queryDesc->planstate, | 		ExecParallelReportInstrumentation(queryDesc->planstate, | ||||||
| 										  instrumentation); | 										  instrumentation); | ||||||
|  |  | ||||||
|  | 	/* Report JIT instrumentation data if any */ | ||||||
|  | 	if (queryDesc->estate->es_jit && jit_instrumentation != NULL) | ||||||
|  | 	{ | ||||||
|  | 		Assert(ParallelWorkerNumber < jit_instrumentation->num_workers); | ||||||
|  | 		jit_instrumentation->jit_instr[ParallelWorkerNumber] = | ||||||
|  | 			queryDesc->estate->es_jit->instr; | ||||||
|  | 	} | ||||||
|  |  | ||||||
| 	/* Must do this after capturing instrumentation. */ | 	/* Must do this after capturing instrumentation. */ | ||||||
| 	ExecutorEnd(queryDesc); | 	ExecutorEnd(queryDesc); | ||||||
|  |  | ||||||
|   | |||||||
| @@ -182,6 +182,17 @@ jit_compile_expr(struct ExprState *state) | |||||||
| 	return false; | 	return false; | ||||||
| } | } | ||||||
|  |  | ||||||
|  | /* Aggregate JIT instrumentation information */ | ||||||
|  | void | ||||||
|  | InstrJitAgg(JitInstrumentation *dst, JitInstrumentation *add) | ||||||
|  | { | ||||||
|  | 	dst->created_functions += add->created_functions; | ||||||
|  | 	INSTR_TIME_ADD(dst->generation_counter, add->generation_counter); | ||||||
|  | 	INSTR_TIME_ADD(dst->inlining_counter, add->inlining_counter); | ||||||
|  | 	INSTR_TIME_ADD(dst->optimization_counter, add->optimization_counter); | ||||||
|  | 	INSTR_TIME_ADD(dst->emission_counter, add->emission_counter); | ||||||
|  | } | ||||||
|  |  | ||||||
| static bool | static bool | ||||||
| file_exists(const char *name) | file_exists(const char *name) | ||||||
| { | { | ||||||
|   | |||||||
| @@ -224,7 +224,7 @@ llvm_expand_funcname(struct LLVMJitContext *context, const char *basename) | |||||||
| { | { | ||||||
| 	Assert(context->module != NULL); | 	Assert(context->module != NULL); | ||||||
|  |  | ||||||
| 	context->base.created_functions++; | 	context->base.instr.created_functions++; | ||||||
|  |  | ||||||
| 	/* | 	/* | ||||||
| 	 * Previously we used dots to separate, but turns out some tools, e.g. | 	 * Previously we used dots to separate, but turns out some tools, e.g. | ||||||
| @@ -504,7 +504,7 @@ llvm_compile_module(LLVMJitContext *context) | |||||||
| 		INSTR_TIME_SET_CURRENT(starttime); | 		INSTR_TIME_SET_CURRENT(starttime); | ||||||
| 		llvm_inline(context->module); | 		llvm_inline(context->module); | ||||||
| 		INSTR_TIME_SET_CURRENT(endtime); | 		INSTR_TIME_SET_CURRENT(endtime); | ||||||
| 		INSTR_TIME_ACCUM_DIFF(context->base.inlining_counter, | 		INSTR_TIME_ACCUM_DIFF(context->base.instr.inlining_counter, | ||||||
| 							  endtime, starttime); | 							  endtime, starttime); | ||||||
| 	} | 	} | ||||||
|  |  | ||||||
| @@ -524,7 +524,7 @@ llvm_compile_module(LLVMJitContext *context) | |||||||
| 	INSTR_TIME_SET_CURRENT(starttime); | 	INSTR_TIME_SET_CURRENT(starttime); | ||||||
| 	llvm_optimize_module(context, context->module); | 	llvm_optimize_module(context, context->module); | ||||||
| 	INSTR_TIME_SET_CURRENT(endtime); | 	INSTR_TIME_SET_CURRENT(endtime); | ||||||
| 	INSTR_TIME_ACCUM_DIFF(context->base.optimization_counter, | 	INSTR_TIME_ACCUM_DIFF(context->base.instr.optimization_counter, | ||||||
| 						  endtime, starttime); | 						  endtime, starttime); | ||||||
|  |  | ||||||
| 	if (jit_dump_bitcode) | 	if (jit_dump_bitcode) | ||||||
| @@ -575,7 +575,7 @@ llvm_compile_module(LLVMJitContext *context) | |||||||
| 	} | 	} | ||||||
| #endif | #endif | ||||||
| 	INSTR_TIME_SET_CURRENT(endtime); | 	INSTR_TIME_SET_CURRENT(endtime); | ||||||
| 	INSTR_TIME_ACCUM_DIFF(context->base.emission_counter, | 	INSTR_TIME_ACCUM_DIFF(context->base.instr.emission_counter, | ||||||
| 						  endtime, starttime); | 						  endtime, starttime); | ||||||
|  |  | ||||||
| 	context->module = NULL; | 	context->module = NULL; | ||||||
| @@ -596,9 +596,9 @@ llvm_compile_module(LLVMJitContext *context) | |||||||
|  |  | ||||||
| 	ereport(DEBUG1, | 	ereport(DEBUG1, | ||||||
| 			(errmsg("time to inline: %.3fs, opt: %.3fs, emit: %.3fs", | 			(errmsg("time to inline: %.3fs, opt: %.3fs, emit: %.3fs", | ||||||
| 					INSTR_TIME_GET_DOUBLE(context->base.inlining_counter), | 					INSTR_TIME_GET_DOUBLE(context->base.instr.inlining_counter), | ||||||
| 					INSTR_TIME_GET_DOUBLE(context->base.optimization_counter), | 					INSTR_TIME_GET_DOUBLE(context->base.instr.optimization_counter), | ||||||
| 					INSTR_TIME_GET_DOUBLE(context->base.emission_counter)), | 					INSTR_TIME_GET_DOUBLE(context->base.instr.emission_counter)), | ||||||
| 			 errhidestmt(true), | 			 errhidestmt(true), | ||||||
| 			 errhidecontext(true))); | 			 errhidecontext(true))); | ||||||
| } | } | ||||||
|   | |||||||
| @@ -2557,7 +2557,7 @@ llvm_compile_expr(ExprState *state) | |||||||
| 	llvm_leave_fatal_on_oom(); | 	llvm_leave_fatal_on_oom(); | ||||||
|  |  | ||||||
| 	INSTR_TIME_SET_CURRENT(endtime); | 	INSTR_TIME_SET_CURRENT(endtime); | ||||||
| 	INSTR_TIME_ACCUM_DIFF(context->base.generation_counter, | 	INSTR_TIME_ACCUM_DIFF(context->base.instr.generation_counter, | ||||||
| 						  endtime, starttime); | 						  endtime, starttime); | ||||||
|  |  | ||||||
| 	return true; | 	return true; | ||||||
|   | |||||||
| @@ -81,7 +81,8 @@ extern void ExplainOnePlan(PlannedStmt *plannedstmt, IntoClause *into, | |||||||
| extern void ExplainPrintPlan(ExplainState *es, QueryDesc *queryDesc); | extern void ExplainPrintPlan(ExplainState *es, QueryDesc *queryDesc); | ||||||
| extern void ExplainPrintTriggers(ExplainState *es, QueryDesc *queryDesc); | extern void ExplainPrintTriggers(ExplainState *es, QueryDesc *queryDesc); | ||||||
|  |  | ||||||
| extern void ExplainPrintJIT(ExplainState *es, QueryDesc *queryDesc); | extern void ExplainPrintJIT(ExplainState *es, int jit_flags, | ||||||
|  | 				struct JitInstrumentation *jit_instr, int worker_i); | ||||||
|  |  | ||||||
| extern void ExplainQueryText(ExplainState *es, QueryDesc *queryDesc); | extern void ExplainQueryText(ExplainState *es, QueryDesc *queryDesc); | ||||||
|  |  | ||||||
|   | |||||||
| @@ -27,6 +27,7 @@ typedef struct ParallelExecutorInfo | |||||||
| 	ParallelContext *pcxt;		/* parallel context we're using */ | 	ParallelContext *pcxt;		/* parallel context we're using */ | ||||||
| 	BufferUsage *buffer_usage;	/* points to bufusage area in DSM */ | 	BufferUsage *buffer_usage;	/* points to bufusage area in DSM */ | ||||||
| 	SharedExecutorInstrumentation *instrumentation; /* optional */ | 	SharedExecutorInstrumentation *instrumentation; /* optional */ | ||||||
|  | 	struct SharedJitInstrumentation *jit_instrumentation; /* optional */ | ||||||
| 	dsa_area   *area;			/* points to DSA area in DSM */ | 	dsa_area   *area;			/* points to DSA area in DSM */ | ||||||
| 	dsa_pointer param_exec;		/* serialized PARAM_EXEC parameters */ | 	dsa_pointer param_exec;		/* serialized PARAM_EXEC parameters */ | ||||||
| 	bool		finished;		/* set true by ExecParallelFinish */ | 	bool		finished;		/* set true by ExecParallelFinish */ | ||||||
|   | |||||||
| @@ -24,13 +24,8 @@ | |||||||
| #define PGJIT_DEFORM   (1 << 4) | #define PGJIT_DEFORM   (1 << 4) | ||||||
|  |  | ||||||
|  |  | ||||||
| typedef struct JitContext | typedef struct JitInstrumentation | ||||||
| { | { | ||||||
| 	/* see PGJIT_* above */ |  | ||||||
| 	int			flags; |  | ||||||
|  |  | ||||||
| 	ResourceOwner resowner; |  | ||||||
|  |  | ||||||
| 	/* number of emitted functions */ | 	/* number of emitted functions */ | ||||||
| 	size_t		created_functions; | 	size_t		created_functions; | ||||||
|  |  | ||||||
| @@ -45,6 +40,25 @@ typedef struct JitContext | |||||||
|  |  | ||||||
| 	/* accumulated time for code emission */ | 	/* accumulated time for code emission */ | ||||||
| 	instr_time	emission_counter; | 	instr_time	emission_counter; | ||||||
|  | } JitInstrumentation; | ||||||
|  |  | ||||||
|  | /* | ||||||
|  |  * DSM structure for accumulating jit instrumentation of all workers. | ||||||
|  |  */ | ||||||
|  | typedef struct SharedJitInstrumentation | ||||||
|  | { | ||||||
|  | 	int			num_workers; | ||||||
|  | 	JitInstrumentation jit_instr[FLEXIBLE_ARRAY_MEMBER]; | ||||||
|  | } SharedJitInstrumentation; | ||||||
|  |  | ||||||
|  | typedef struct JitContext | ||||||
|  | { | ||||||
|  | 	/* see PGJIT_* above */ | ||||||
|  | 	int			flags; | ||||||
|  |  | ||||||
|  | 	ResourceOwner resowner; | ||||||
|  |  | ||||||
|  | 	JitInstrumentation instr; | ||||||
| } JitContext; | } JitContext; | ||||||
|  |  | ||||||
| typedef struct JitProviderCallbacks JitProviderCallbacks; | typedef struct JitProviderCallbacks JitProviderCallbacks; | ||||||
| @@ -85,6 +99,7 @@ extern void jit_release_context(JitContext *context); | |||||||
|  * not be able to perform JIT (i.e. return false). |  * not be able to perform JIT (i.e. return false). | ||||||
|  */ |  */ | ||||||
| extern bool jit_compile_expr(struct ExprState *state); | extern bool jit_compile_expr(struct ExprState *state); | ||||||
|  | extern void InstrJitAgg(JitInstrumentation *dst, JitInstrumentation *add); | ||||||
|  |  | ||||||
|  |  | ||||||
| #endif							/* JIT_H */ | #endif							/* JIT_H */ | ||||||
|   | |||||||
| @@ -569,9 +569,14 @@ typedef struct EState | |||||||
| 	 * JIT information. es_jit_flags indicates whether JIT should be performed | 	 * JIT information. es_jit_flags indicates whether JIT should be performed | ||||||
| 	 * and with which options.  es_jit is created on-demand when JITing is | 	 * and with which options.  es_jit is created on-demand when JITing is | ||||||
| 	 * performed. | 	 * performed. | ||||||
|  | 	 * | ||||||
|  | 	 * es_jit_combined_instr, at the end of query execution with | ||||||
|  | 	 * instrumentation enabled, is the the combined instrumentation | ||||||
|  | 	 * information of leader and followers. | ||||||
| 	 */ | 	 */ | ||||||
| 	int			es_jit_flags; | 	int			es_jit_flags; | ||||||
| 	struct JitContext *es_jit; | 	struct JitContext *es_jit; | ||||||
|  | 	struct JitInstrumentation *es_jit_combined_instr; | ||||||
| } EState; | } EState; | ||||||
|  |  | ||||||
|  |  | ||||||
| @@ -923,6 +928,9 @@ typedef struct PlanState | |||||||
| 	Instrumentation *instrument;	/* Optional runtime stats for this node */ | 	Instrumentation *instrument;	/* Optional runtime stats for this node */ | ||||||
| 	WorkerInstrumentation *worker_instrument;	/* per-worker instrumentation */ | 	WorkerInstrumentation *worker_instrument;	/* per-worker instrumentation */ | ||||||
|  |  | ||||||
|  | 	/* Per-worker JIT instrumentation */ | ||||||
|  | 	struct SharedJitInstrumentation *worker_jit_instrument; | ||||||
|  |  | ||||||
| 	/* | 	/* | ||||||
| 	 * Common structural data for all Plan types.  These links to subsidiary | 	 * Common structural data for all Plan types.  These links to subsidiary | ||||||
| 	 * state trees parallel links in the associated plan tree (except for the | 	 * state trees parallel links in the associated plan tree (except for the | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user