mirror of
https://github.com/postgres/postgres.git
synced 2025-07-21 16:02:15 +03:00
Fix bitmapheapscan incorrect recheck of NULL tuples
The bitmap heap scan skip fetch optimization skips fetching the heap block when a page is set all-visible in the visibility map and no columns from the table are needed to satisfy the query.2b73a8cd33
andc3953226a0
changed the control flow of bitmap heap scan to use the read stream API. The read stream API returns buffers containing blocks to the user. To make this work with the skip fetch optimization, we keep a count of the empty tuples we need to emit for all the blocks skipped and only emit the empty tuples after processing the next block fetched from the heap or at the end of the scan. It's incorrect to recheck NULL tuples, so we must set `recheck` to false before yielding control back to BitmapHeapNext(). This was done before emitting any remaining empty tuples at the end of the scan but not for empty tuples emitted during the scan. This meant that if a page fetched from the heap did require recheck and set `recheck` to true and then we emitted empty tuples for subsequent blocks, we would get wrong results. Fix this by always setting `recheck` to false before emitting empty tuples. Reported-by: Alexander Lakhin <exclusion@gmail.com> Tested-by: Andres Freund <andres@anarazel.de> Discussion: https://postgr.es/m/496f7acd-881c-4df3-9bd3-8f8534dfec26%40gmail.com
This commit is contained in:
@ -2147,6 +2147,19 @@ heapam_scan_bitmap_next_tuple(TableScanDesc scan,
|
|||||||
*/
|
*/
|
||||||
ExecStoreAllNullTuple(slot);
|
ExecStoreAllNullTuple(slot);
|
||||||
bscan->rs_empty_tuples_pending--;
|
bscan->rs_empty_tuples_pending--;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* We do not recheck all NULL tuples. Because the streaming read
|
||||||
|
* API only yields TBMIterateResults for blocks actually fetched
|
||||||
|
* from the heap, we must unset `recheck` ourselves here to ensure
|
||||||
|
* correct results.
|
||||||
|
*
|
||||||
|
* Our read stream callback accrues a count of empty tuples to
|
||||||
|
* emit and then emits them after emitting tuples from the next
|
||||||
|
* fetched block. If no blocks need fetching, we'll emit the
|
||||||
|
* accrued count at the end of the scan.
|
||||||
|
*/
|
||||||
|
*recheck = false;
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -2510,13 +2523,14 @@ BitmapHeapScanNextBlock(TableScanDesc scan,
|
|||||||
}
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Bitmap is exhausted. Time to emit empty tuples if relevant. We emit
|
* The bitmap is exhausted. Now emit any remaining empty tuples. The
|
||||||
* all empty tuples at the end instead of emitting them per block we
|
* read stream API only returns TBMIterateResults for blocks actually
|
||||||
* skip fetching. This is necessary because the streaming read API
|
* fetched from the heap. Our callback will accrue a count of empty
|
||||||
* will only return TBMIterateResults for blocks actually fetched.
|
* tuples to emit for all blocks we skipped fetching. So, if we skip
|
||||||
* When we skip fetching a block, we keep track of how many empty
|
* fetching heap blocks at the end of the relation (or no heap blocks
|
||||||
* tuples to emit at the end of the BitmapHeapScan. We do not recheck
|
* are fetched) we need to ensure we emit empty tuples before ending
|
||||||
* all NULL tuples.
|
* the scan. We don't recheck empty tuples so ensure `recheck` is
|
||||||
|
* unset.
|
||||||
*/
|
*/
|
||||||
*recheck = false;
|
*recheck = false;
|
||||||
return bscan->rs_empty_tuples_pending > 0;
|
return bscan->rs_empty_tuples_pending > 0;
|
||||||
|
@ -8,7 +8,7 @@
|
|||||||
-- there's a maximum number of a,b combinations in the table.
|
-- there's a maximum number of a,b combinations in the table.
|
||||||
-- That allows us to test all the different combinations of
|
-- That allows us to test all the different combinations of
|
||||||
-- lossy and non-lossy pages with the minimum amount of data
|
-- lossy and non-lossy pages with the minimum amount of data
|
||||||
CREATE TABLE bmscantest (a int, b int, t text);
|
CREATE TABLE bmscantest (a int, b int, t text) WITH (autovacuum_enabled = false);
|
||||||
INSERT INTO bmscantest
|
INSERT INTO bmscantest
|
||||||
SELECT (r%53), (r%59), 'foooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooo'
|
SELECT (r%53), (r%59), 'foooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooo'
|
||||||
FROM generate_series(1,70000) r;
|
FROM generate_series(1,70000) r;
|
||||||
@ -20,7 +20,17 @@ set enable_indexscan=false;
|
|||||||
set enable_seqscan=false;
|
set enable_seqscan=false;
|
||||||
-- Lower work_mem to trigger use of lossy bitmaps
|
-- Lower work_mem to trigger use of lossy bitmaps
|
||||||
set work_mem = 64;
|
set work_mem = 64;
|
||||||
-- Test bitmap-and.
|
-- Test bitmap-and without the skip fetch optimization.
|
||||||
|
SELECT count(*) FROM bmscantest WHERE a = 1 AND b = 1;
|
||||||
|
count
|
||||||
|
-------
|
||||||
|
23
|
||||||
|
(1 row)
|
||||||
|
|
||||||
|
-- Test that we return correct results when using the skip fetch optimization
|
||||||
|
-- VACUUM FREEZE will set all the pages in the relation all-visible, enabling
|
||||||
|
-- the optimization.
|
||||||
|
VACUUM (FREEZE) bmscantest;
|
||||||
SELECT count(*) FROM bmscantest WHERE a = 1 AND b = 1;
|
SELECT count(*) FROM bmscantest WHERE a = 1 AND b = 1;
|
||||||
count
|
count
|
||||||
-------
|
-------
|
||||||
|
@ -12,7 +12,7 @@
|
|||||||
-- That allows us to test all the different combinations of
|
-- That allows us to test all the different combinations of
|
||||||
-- lossy and non-lossy pages with the minimum amount of data
|
-- lossy and non-lossy pages with the minimum amount of data
|
||||||
|
|
||||||
CREATE TABLE bmscantest (a int, b int, t text);
|
CREATE TABLE bmscantest (a int, b int, t text) WITH (autovacuum_enabled = false);
|
||||||
|
|
||||||
INSERT INTO bmscantest
|
INSERT INTO bmscantest
|
||||||
SELECT (r%53), (r%59), 'foooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooo'
|
SELECT (r%53), (r%59), 'foooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooo'
|
||||||
@ -29,8 +29,14 @@ set enable_seqscan=false;
|
|||||||
-- Lower work_mem to trigger use of lossy bitmaps
|
-- Lower work_mem to trigger use of lossy bitmaps
|
||||||
set work_mem = 64;
|
set work_mem = 64;
|
||||||
|
|
||||||
|
-- Test bitmap-and without the skip fetch optimization.
|
||||||
|
SELECT count(*) FROM bmscantest WHERE a = 1 AND b = 1;
|
||||||
|
|
||||||
|
-- Test that we return correct results when using the skip fetch optimization
|
||||||
|
-- VACUUM FREEZE will set all the pages in the relation all-visible, enabling
|
||||||
|
-- the optimization.
|
||||||
|
VACUUM (FREEZE) bmscantest;
|
||||||
|
|
||||||
-- Test bitmap-and.
|
|
||||||
SELECT count(*) FROM bmscantest WHERE a = 1 AND b = 1;
|
SELECT count(*) FROM bmscantest WHERE a = 1 AND b = 1;
|
||||||
|
|
||||||
-- Test bitmap-or.
|
-- Test bitmap-or.
|
||||||
|
Reference in New Issue
Block a user