ATRewriteTable() calls table_tuple_insert() with a bistate, to avoid clobbering and polluting shared buffers.
But heap_insert() then goes through this call chain:

  heap_prepare_insert()
    > heap_toast_insert_or_update
    > toast_tuple_externalize
    > toast_save_datum
    > heap_insert(toastrel, toasttup, mycid, options, NULL /* without bistate:( */);

So the toast tuples are inserted without the bistate, and writes to the toast table still go through (and dirty) the regular shared buffers.

I came up with this patch. I'm not sure, but maybe it should be implemented at the tableam layer and not inside heap. Maybe the BulkInsertState should have a 2nd strategy buffer for toast tables.

To reproduce:

CREATE TABLE t(i int, a text, b text, c text,d text,e text,f text,g text);
INSERT INTO t SELECT 0, array_agg(a),array_agg(a),array_agg(a),array_agg(a),array_agg(a),array_agg(a) FROM generate_series(1,999)n,repeat(n::text,99)a,generate_series(1,99)b GROUP BY b;
INSERT INTO t SELECT * FROM t;
INSERT INTO t SELECT * FROM t;
INSERT INTO t SELECT * FROM t;
INSERT INTO t SELECT * FROM t;
ALTER TABLE t ALTER i TYPE smallint;
SELECT COUNT(1), relname, COUNT(1) FILTER(WHERE isdirty) FROM pg_buffercache b JOIN pg_class c ON c.oid=b.relfilenode GROUP BY 2 ORDER BY 1 DESC LIMIT 9;

Without this patch:

postgres=# SELECT COUNT(1), relname, COUNT(1) FILTER(WHERE isdirty) FROM pg_buffercache b JOIN pg_class c ON c.oid=b.relfilenode GROUP BY 2 ORDER BY 1 DESC LIMIT 9;
 10283 | pg_toast_55759 | 8967

With this patch:

 1418 | pg_toast_16597 | 1418

-- 
Justin
>From 2b156036856dcbeab00de819e5c6eff820b564cd Mon Sep 17 00:00:00 2001 From: Justin Pryzby <pryz...@telsasoft.com> Date: Tue, 21 Jun 2022 22:28:06 -0500 Subject: [PATCH] WIP: use BulkInsertState for toast tuples, too ci-os-only: linux --- src/backend/access/common/toast_internals.c | 16 ++++++++++++++-- src/backend/access/heap/heapam.c | 14 ++++++++------ src/backend/access/heap/heaptoast.c | 11 +++++++---- src/backend/access/heap/rewriteheap.c | 2 +- src/backend/access/table/toast_helper.c | 6 ++++-- src/include/access/heaptoast.h | 4 +++- src/include/access/toast_helper.h | 3 ++- src/include/access/toast_internals.h | 4 +++- 8 files changed, 42 insertions(+), 18 deletions(-) diff --git a/src/backend/access/common/toast_internals.c b/src/backend/access/common/toast_internals.c index 576e585a89f..2640e6a1589 100644 --- a/src/backend/access/common/toast_internals.c +++ b/src/backend/access/common/toast_internals.c @@ -118,7 +118,8 @@ toast_compress_datum(Datum value, char cmethod) */ Datum toast_save_datum(Relation rel, Datum value, - struct varlena *oldexternal, int options) + struct varlena *oldexternal, int options, + BulkInsertState bistate) { Relation toastrel; Relation *toastidxs; @@ -299,6 +300,10 @@ toast_save_datum(Relation rel, Datum value, t_isnull[1] = false; t_isnull[2] = false; + /* Release pin after main table, before switching to write to toast table */ + if (bistate) + ReleaseBulkInsertStatePin(bistate); + /* * Split up the item into chunks */ @@ -321,7 +326,7 @@ toast_save_datum(Relation rel, Datum value, memcpy(VARDATA(&chunk_data), data_p, chunk_size); toasttup = heap_form_tuple(toasttupDesc, t_values, t_isnull); - heap_insert(toastrel, toasttup, mycid, options, NULL); + heap_insert(toastrel, toasttup, mycid, options, bistate); /* * Create the index entry. 
We cheat a little here by not using @@ -358,6 +363,13 @@ toast_save_datum(Relation rel, Datum value, data_p += chunk_size; } + if (bistate) + { + table_finish_bulk_insert(toastrel, options); // XXX + /* Release pin after writing toast table before resuming writes to the main table */ + ReleaseBulkInsertStatePin(bistate); + } + /* * Done - close toast relation and its indexes but keep the lock until * commit, so as a concurrent reindex done directly on the toast relation diff --git a/src/backend/access/heap/heapam.c b/src/backend/access/heap/heapam.c index 74218510276..e46a6035068 100644 --- a/src/backend/access/heap/heapam.c +++ b/src/backend/access/heap/heapam.c @@ -73,7 +73,8 @@ static HeapTuple heap_prepare_insert(Relation relation, HeapTuple tup, - TransactionId xid, CommandId cid, int options); + TransactionId xid, CommandId cid, int options, + BulkInsertState bistate); static XLogRecPtr log_heap_update(Relation reln, Buffer oldbuf, Buffer newbuf, HeapTuple oldtup, HeapTuple newtup, HeapTuple old_key_tuple, @@ -2042,7 +2043,8 @@ heap_insert(Relation relation, HeapTuple tup, CommandId cid, * Note: below this point, heaptup is the data we actually intend to store * into the relation; tup is the caller's original untoasted data. */ - heaptup = heap_prepare_insert(relation, tup, xid, cid, options); + + heaptup = heap_prepare_insert(relation, tup, xid, cid, options, bistate); /* * Find buffer to insert this tuple into. 
If the page is all visible, @@ -2212,7 +2214,7 @@ heap_insert(Relation relation, HeapTuple tup, CommandId cid, */ static HeapTuple heap_prepare_insert(Relation relation, HeapTuple tup, TransactionId xid, - CommandId cid, int options) + CommandId cid, int options, BulkInsertState bistate) { /* * To allow parallel inserts, we need to ensure that they are safe to be @@ -2248,7 +2250,7 @@ heap_prepare_insert(Relation relation, HeapTuple tup, TransactionId xid, return tup; } else if (HeapTupleHasExternal(tup) || tup->t_len > TOAST_TUPLE_THRESHOLD) - return heap_toast_insert_or_update(relation, tup, NULL, options); + return heap_toast_insert_or_update(relation, tup, NULL, options, bistate); else return tup; } @@ -2297,7 +2299,7 @@ heap_multi_insert(Relation relation, TupleTableSlot **slots, int ntuples, slots[i]->tts_tableOid = RelationGetRelid(relation); tuple->t_tableOid = slots[i]->tts_tableOid; heaptuples[i] = heap_prepare_insert(relation, tuple, xid, cid, - options); + options, NULL); } /* @@ -3724,7 +3726,7 @@ l2: if (need_toast) { /* Note we always use WAL and FSM during updates */ - heaptup = heap_toast_insert_or_update(relation, newtup, &oldtup, 0); + heaptup = heap_toast_insert_or_update(relation, newtup, &oldtup, 0, NULL); newtupsize = MAXALIGN(heaptup->t_len); } else diff --git a/src/backend/access/heap/heaptoast.c b/src/backend/access/heap/heaptoast.c index 1575a81b01b..25b07f82cb6 100644 --- a/src/backend/access/heap/heaptoast.c +++ b/src/backend/access/heap/heaptoast.c @@ -94,7 +94,7 @@ heap_toast_delete(Relation rel, HeapTuple oldtup, bool is_speculative) */ HeapTuple heap_toast_insert_or_update(Relation rel, HeapTuple newtup, HeapTuple oldtup, - int options) + int options, BulkInsertState bistate) { HeapTuple result_tuple; TupleDesc tupleDesc; @@ -110,6 +110,9 @@ heap_toast_insert_or_update(Relation rel, HeapTuple newtup, HeapTuple oldtup, ToastAttrInfo toast_attr[MaxHeapAttributeNumber]; ToastTupleContext ttc; + /* Bulk insert is not supported for 
updates, only inserts. */ + Assert(bistate == NULL || oldtup == NULL); + /* * Ignore the INSERT_SPECULATIVE option. Speculative insertions/super * deletions just normally insert/delete the toast values. It seems @@ -214,7 +217,7 @@ heap_toast_insert_or_update(Relation rel, HeapTuple newtup, HeapTuple oldtup, */ if (toast_attr[biggest_attno].tai_size > maxDataLen && rel->rd_rel->reltoastrelid != InvalidOid) - toast_tuple_externalize(&ttc, biggest_attno, options); + toast_tuple_externalize(&ttc, biggest_attno, options, bistate); } /* @@ -231,7 +234,7 @@ heap_toast_insert_or_update(Relation rel, HeapTuple newtup, HeapTuple oldtup, biggest_attno = toast_tuple_find_biggest_attribute(&ttc, false, false); if (biggest_attno < 0) break; - toast_tuple_externalize(&ttc, biggest_attno, options); + toast_tuple_externalize(&ttc, biggest_attno, options, bistate); } /* @@ -267,7 +270,7 @@ heap_toast_insert_or_update(Relation rel, HeapTuple newtup, HeapTuple oldtup, if (biggest_attno < 0) break; - toast_tuple_externalize(&ttc, biggest_attno, options); + toast_tuple_externalize(&ttc, biggest_attno, options, bistate); } /* diff --git a/src/backend/access/heap/rewriteheap.c b/src/backend/access/heap/rewriteheap.c index 2a53826736e..caff247472f 100644 --- a/src/backend/access/heap/rewriteheap.c +++ b/src/backend/access/heap/rewriteheap.c @@ -644,7 +644,7 @@ raw_heap_insert(RewriteState state, HeapTuple tup) options |= HEAP_INSERT_NO_LOGICAL; heaptup = heap_toast_insert_or_update(state->rs_new_rel, tup, NULL, - options); + options, NULL); // XXX } else heaptup = tup; diff --git a/src/backend/access/table/toast_helper.c b/src/backend/access/table/toast_helper.c index 0cc5a30f9b4..764c7a265d5 100644 --- a/src/backend/access/table/toast_helper.c +++ b/src/backend/access/table/toast_helper.c @@ -15,6 +15,7 @@ #include "postgres.h" #include "access/detoast.h" +#include "access/hio.h" #include "access/table.h" #include "access/toast_helper.h" #include "access/toast_internals.h" @@ -253,7 
+254,8 @@ toast_tuple_try_compression(ToastTupleContext *ttc, int attribute) * Move an attribute to external storage. */ void -toast_tuple_externalize(ToastTupleContext *ttc, int attribute, int options) +toast_tuple_externalize(ToastTupleContext *ttc, int attribute, int options, + BulkInsertStateData *bistate) { Datum *value = &ttc->ttc_values[attribute]; Datum old_value = *value; @@ -261,7 +263,7 @@ toast_tuple_externalize(ToastTupleContext *ttc, int attribute, int options) attr->tai_colflags |= TOASTCOL_IGNORE; *value = toast_save_datum(ttc->ttc_rel, old_value, attr->tai_oldexternal, - options); + options, bistate); if ((attr->tai_colflags & TOASTCOL_NEEDS_FREE) != 0) pfree(DatumGetPointer(old_value)); attr->tai_colflags |= TOASTCOL_NEEDS_FREE; diff --git a/src/include/access/heaptoast.h b/src/include/access/heaptoast.h index a75699054af..2db01894c52 100644 --- a/src/include/access/heaptoast.h +++ b/src/include/access/heaptoast.h @@ -13,6 +13,7 @@ #ifndef HEAPTOAST_H #define HEAPTOAST_H +#include "access/hio.h" #include "access/htup_details.h" #include "storage/lockdefs.h" #include "utils/relcache.h" @@ -95,7 +96,8 @@ * ---------- */ extern HeapTuple heap_toast_insert_or_update(Relation rel, HeapTuple newtup, - HeapTuple oldtup, int options); + HeapTuple oldtup, int options, + BulkInsertStateData *bistate); /* ---------- * heap_toast_delete - diff --git a/src/include/access/toast_helper.h b/src/include/access/toast_helper.h index 1e2aaf3303e..46c358b1c29 100644 --- a/src/include/access/toast_helper.h +++ b/src/include/access/toast_helper.h @@ -14,6 +14,7 @@ #ifndef TOAST_HELPER_H #define TOAST_HELPER_H +#include "access/hio.h" #include "utils/rel.h" /* @@ -107,7 +108,7 @@ extern int toast_tuple_find_biggest_attribute(ToastTupleContext *ttc, bool check_main); extern void toast_tuple_try_compression(ToastTupleContext *ttc, int attribute); extern void toast_tuple_externalize(ToastTupleContext *ttc, int attribute, - int options); + int options, BulkInsertStateData 
*bistate); extern void toast_tuple_cleanup(ToastTupleContext *ttc); extern void toast_delete_external(Relation rel, Datum *values, bool *isnull, diff --git a/src/include/access/toast_internals.h b/src/include/access/toast_internals.h index 85e7dc0fc5f..a9265a1856b 100644 --- a/src/include/access/toast_internals.h +++ b/src/include/access/toast_internals.h @@ -12,6 +12,7 @@ #ifndef TOAST_INTERNALS_H #define TOAST_INTERNALS_H +#include "access/hio.h" #include "access/toast_compression.h" #include "storage/lockdefs.h" #include "utils/relcache.h" @@ -50,7 +51,8 @@ extern Oid toast_get_valid_index(Oid toastoid, LOCKMODE lock); extern void toast_delete_datum(Relation rel, Datum value, bool is_speculative); extern Datum toast_save_datum(Relation rel, Datum value, - struct varlena *oldexternal, int options); + struct varlena *oldexternal, int options, + BulkInsertStateData *bistate); extern int toast_open_indexes(Relation toastrel, LOCKMODE lock, -- 2.17.1