mirror of
				https://github.com/postgres/postgres.git
				synced 2025-10-25 13:17:41 +03:00 
			
		
		
		
	Fix past pd_upper write in ginRedoRecompress()
ginRedoRecompress() replays actions over compressed segments of posting list in-place. However, it might lead to write past pg_upper, because intermediate state during playing the changes can take more space than both original state and final state. This commit fixes that by refuse from in-place modification. Instead page tail is copied once modification is started, and then it's used as the source of original segments. Backpatch to 9.4 where posting list compression was introduced. Reported-by: Sivasubramanian Ramasubramanian Discussion: https://postgr.es/m/1536091151804.6588%40amazon.com Author: Alexander Korotkov based on patch from and ideas by Sivasubramanian Ramasubramanian Review: Sivasubramanian Ramasubramanian Backpatch-through: 9.4
This commit is contained in:
		| @@ -142,6 +142,14 @@ ginRedoInsertEntry(Buffer buffer, bool isLeaf, BlockNumber rightblkno, void *rda | |||||||
| 	} | 	} | ||||||
| } | } | ||||||
|  |  | ||||||
|  | /* | ||||||
|  |  * Redo recompression of posting list.  Doing all the changes in-place is not | ||||||
|  |  * always possible, because it might require more space than we've on the page. | ||||||
|  |  * Instead, once modification is required we copy unprocessed tail of the page | ||||||
|  |  * into separately allocated chunk of memory for further reading original | ||||||
|  |  * versions of segments.  Thanks to that we don't bother about moving page data | ||||||
|  |  * in-place. | ||||||
|  |  */ | ||||||
| static void | static void | ||||||
| ginRedoRecompress(Page page, ginxlogRecompressDataLeaf *data) | ginRedoRecompress(Page page, ginxlogRecompressDataLeaf *data) | ||||||
| { | { | ||||||
| @@ -151,6 +159,9 @@ ginRedoRecompress(Page page, ginxlogRecompressDataLeaf *data) | |||||||
| 	Pointer		segmentend; | 	Pointer		segmentend; | ||||||
| 	char	   *walbuf; | 	char	   *walbuf; | ||||||
| 	int			totalsize; | 	int			totalsize; | ||||||
|  | 	Pointer		tailCopy = NULL; | ||||||
|  | 	Pointer		writePtr; | ||||||
|  | 	Pointer		segptr; | ||||||
|  |  | ||||||
| 	/* | 	/* | ||||||
| 	 * If the page is in pre-9.4 format, convert to new format first. | 	 * If the page is in pre-9.4 format, convert to new format first. | ||||||
| @@ -190,6 +201,7 @@ ginRedoRecompress(Page page, ginxlogRecompressDataLeaf *data) | |||||||
| 	} | 	} | ||||||
|  |  | ||||||
| 	oldseg = GinDataLeafPageGetPostingList(page); | 	oldseg = GinDataLeafPageGetPostingList(page); | ||||||
|  | 	writePtr = (Pointer) oldseg; | ||||||
| 	segmentend = (Pointer) oldseg + GinDataLeafPageGetPostingListSize(page); | 	segmentend = (Pointer) oldseg + GinDataLeafPageGetPostingListSize(page); | ||||||
| 	segno = 0; | 	segno = 0; | ||||||
|  |  | ||||||
| @@ -207,8 +219,6 @@ ginRedoRecompress(Page page, ginxlogRecompressDataLeaf *data) | |||||||
| 		ItemPointerData *newitems; | 		ItemPointerData *newitems; | ||||||
| 		int			nnewitems; | 		int			nnewitems; | ||||||
| 		int			segsize; | 		int			segsize; | ||||||
| 		Pointer		segptr; |  | ||||||
| 		int			szleft; |  | ||||||
|  |  | ||||||
| 		/* Extract all the information we need from the WAL record */ | 		/* Extract all the information we need from the WAL record */ | ||||||
| 		if (a_action == GIN_SEGMENT_INSERT || | 		if (a_action == GIN_SEGMENT_INSERT || | ||||||
| @@ -231,6 +241,17 @@ ginRedoRecompress(Page page, ginxlogRecompressDataLeaf *data) | |||||||
| 		Assert(segno <= a_segno); | 		Assert(segno <= a_segno); | ||||||
| 		while (segno < a_segno) | 		while (segno < a_segno) | ||||||
| 		{ | 		{ | ||||||
|  | 			/* | ||||||
|  | 			 * Once modification is started and page tail is copied, we've | ||||||
|  | 			 * to copy unmodified segments. | ||||||
|  | 			 */ | ||||||
|  | 			segsize = SizeOfGinPostingList(oldseg); | ||||||
|  | 			if (tailCopy) | ||||||
|  | 			{ | ||||||
|  | 				Assert(writePtr + segsize < PageGetSpecialPointer(page)); | ||||||
|  | 				memcpy(writePtr, (Pointer) oldseg, segsize); | ||||||
|  | 			} | ||||||
|  | 			writePtr += segsize; | ||||||
| 			oldseg = GinNextPostingListSegment(oldseg); | 			oldseg = GinNextPostingListSegment(oldseg); | ||||||
| 			segno++; | 			segno++; | ||||||
| 		} | 		} | ||||||
| @@ -271,36 +292,42 @@ ginRedoRecompress(Page page, ginxlogRecompressDataLeaf *data) | |||||||
| 			Assert(a_action == GIN_SEGMENT_INSERT); | 			Assert(a_action == GIN_SEGMENT_INSERT); | ||||||
| 			segsize = 0; | 			segsize = 0; | ||||||
| 		} | 		} | ||||||
| 		szleft = segmentend - segptr; |  | ||||||
|  | 		/* | ||||||
|  | 		 * We're about to start modification of the page.  So, copy tail of the | ||||||
|  | 		 * page if it's not done already. | ||||||
|  | 		 */ | ||||||
|  | 		if (!tailCopy && segptr != segmentend) | ||||||
|  | 		{ | ||||||
|  | 			int tailSize = segmentend - segptr; | ||||||
|  |  | ||||||
|  | 			tailCopy = (Pointer) palloc(tailSize); | ||||||
|  | 			memcpy(tailCopy, segptr, tailSize); | ||||||
|  | 			segptr = tailCopy; | ||||||
|  | 			oldseg = (GinPostingList *) segptr; | ||||||
|  | 			segmentend = segptr + tailSize; | ||||||
|  | 		} | ||||||
|  |  | ||||||
| 		switch (a_action) | 		switch (a_action) | ||||||
| 		{ | 		{ | ||||||
| 			case GIN_SEGMENT_DELETE: | 			case GIN_SEGMENT_DELETE: | ||||||
| 				memmove(segptr, segptr + segsize, szleft - segsize); | 				segptr += segsize; | ||||||
| 				segmentend -= segsize; |  | ||||||
|  |  | ||||||
| 				segno++; | 				segno++; | ||||||
| 				break; | 				break; | ||||||
|  |  | ||||||
| 			case GIN_SEGMENT_INSERT: | 			case GIN_SEGMENT_INSERT: | ||||||
| 				/* make room for the new segment */ |  | ||||||
| 				memmove(segptr + newsegsize, segptr, szleft); |  | ||||||
| 				/* copy the new segment in place */ | 				/* copy the new segment in place */ | ||||||
| 				memcpy(segptr, newseg, newsegsize); | 				Assert(writePtr + newsegsize <= PageGetSpecialPointer(page)); | ||||||
| 				segmentend += newsegsize; | 				memcpy(writePtr, newseg, newsegsize); | ||||||
| 				segptr += newsegsize; | 				writePtr += newsegsize; | ||||||
| 				break; | 				break; | ||||||
|  |  | ||||||
| 			case GIN_SEGMENT_REPLACE: | 			case GIN_SEGMENT_REPLACE: | ||||||
| 				/* shift the segments that follow */ | 				/* copy the new version of segment in place */ | ||||||
| 				memmove(segptr + newsegsize, | 				Assert(writePtr + newsegsize <= PageGetSpecialPointer(page)); | ||||||
| 						segptr + segsize, | 				memcpy(writePtr, newseg, newsegsize); | ||||||
| 						szleft - segsize); | 				writePtr += newsegsize; | ||||||
| 				/* copy the replacement segment in place */ | 				segptr += segsize; | ||||||
| 				memcpy(segptr, newseg, newsegsize); |  | ||||||
| 				segmentend -= segsize; |  | ||||||
| 				segmentend += newsegsize; |  | ||||||
| 				segptr += newsegsize; |  | ||||||
| 				segno++; | 				segno++; | ||||||
| 				break; | 				break; | ||||||
|  |  | ||||||
| @@ -310,7 +337,18 @@ ginRedoRecompress(Page page, ginxlogRecompressDataLeaf *data) | |||||||
| 		oldseg = (GinPostingList *) segptr; | 		oldseg = (GinPostingList *) segptr; | ||||||
| 	} | 	} | ||||||
|  |  | ||||||
| 	totalsize = segmentend - (Pointer) GinDataLeafPageGetPostingList(page); | 	/* Copy the rest of unmodified segments if any. */ | ||||||
|  | 	segptr = (Pointer) oldseg; | ||||||
|  | 	if (segptr != segmentend && tailCopy) | ||||||
|  | 	{ | ||||||
|  | 		int restSize = segmentend - segptr; | ||||||
|  |  | ||||||
|  | 		Assert(writePtr + restSize <= PageGetSpecialPointer(page)); | ||||||
|  | 		memcpy(writePtr, segptr, restSize); | ||||||
|  | 		writePtr += restSize; | ||||||
|  | 	} | ||||||
|  |  | ||||||
|  | 	totalsize = writePtr - (Pointer) GinDataLeafPageGetPostingList(page); | ||||||
| 	GinDataPageSetDataSize(page, totalsize); | 	GinDataPageSetDataSize(page, totalsize); | ||||||
| } | } | ||||||
|  |  | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user