mirror of
https://github.com/postgres/postgres.git
synced 2025-11-19 13:42:17 +03:00
Use column collation for extended statistics
The current extended statistics code was a bit confused about which collation to use. When building the statistics, the collations defined as default for the data types were used (since commit 5e0928005). The MCV code was however using the column collations for MCV serialization, and then DEFAULT_COLLATION_OID when computing estimates. So overall the code was using all three possible options, inconsistently. This uses the column collation everywhere - this makes it consistent with what 5e0928005 did for regular stats. We however do not track the collations in a catalog, because we can derive them from column-level information. This may need to change in the future, e.g. after allowing statistics on expressions. Reviewed-by: Tom Lane Discussion: https://postgr.es/m/8736jdhbhc.fsf%40ansel.ydns.eu Backpatch-to: 12
This commit is contained in:
@@ -366,7 +366,7 @@ build_mss(VacAttrStats **stats, int numattrs)
|
||||
elog(ERROR, "cache lookup failed for ordering operator for type %u",
|
||||
colstat->attrtypid);
|
||||
|
||||
multi_sort_add_dimension(mss, i, type->lt_opr, type->typcollation);
|
||||
multi_sort_add_dimension(mss, i, type->lt_opr, colstat->attrcollid);
|
||||
}
|
||||
|
||||
return mss;
|
||||
@@ -686,7 +686,7 @@ statext_mcv_serialize(MCVList *mcvlist, VacAttrStats **stats)
|
||||
|
||||
/* sort and deduplicate the data */
|
||||
ssup[dim].ssup_cxt = CurrentMemoryContext;
|
||||
ssup[dim].ssup_collation = DEFAULT_COLLATION_OID;
|
||||
ssup[dim].ssup_collation = stats[dim]->attrcollid;
|
||||
ssup[dim].ssup_nulls_first = false;
|
||||
|
||||
PrepareSortSupportFromOrderingOp(typentry->lt_opr, &ssup[dim]);
|
||||
@@ -1630,15 +1630,22 @@ mcv_get_match_bitmap(PlannerInfo *root, List *clauses,
|
||||
* First check whether the constant is below the lower
|
||||
* boundary (in that case we can skip the bucket, because
|
||||
* there's no overlap).
|
||||
*
|
||||
* We don't store collations used to build the statistics,
|
||||
* but we can use the collation for the attribute itself,
|
||||
* as stored in varcollid. We do reset the statistics after
|
||||
* a type change (including collation change), so this is
|
||||
* OK. We may need to relax this after allowing extended
|
||||
* statistics on expressions.
|
||||
*/
|
||||
if (varonleft)
|
||||
match = DatumGetBool(FunctionCall2Coll(&opproc,
|
||||
DEFAULT_COLLATION_OID,
|
||||
var->varcollid,
|
||||
item->values[idx],
|
||||
cst->constvalue));
|
||||
else
|
||||
match = DatumGetBool(FunctionCall2Coll(&opproc,
|
||||
DEFAULT_COLLATION_OID,
|
||||
var->varcollid,
|
||||
cst->constvalue,
|
||||
item->values[idx]));
|
||||
|
||||
|
||||
Reference in New Issue
Block a user