Branch data Line data Source code
1 : : /* -------------------------------------------------------------------------
2 : : *
3 : : * pgstat_relation.c
4 : : * Implementation of relation statistics.
5 : : *
6 : : * This file contains the implementation of relation statistics. It is kept
7 : : * separate from pgstat.c to enforce the line between the statistics access /
8 : : * storage implementation and the details about individual types of
9 : : * statistics.
10 : : *
11 : : * Copyright (c) 2001-2026, PostgreSQL Global Development Group
12 : : *
13 : : * IDENTIFICATION
14 : : * src/backend/utils/activity/pgstat_relation.c
15 : : * -------------------------------------------------------------------------
16 : : */
17 : :
18 : : #include "postgres.h"
19 : :
20 : : #include "access/twophase_rmgr.h"
21 : : #include "access/xact.h"
22 : : #include "catalog/catalog.h"
23 : : #include "utils/memutils.h"
24 : : #include "utils/pgstat_internal.h"
25 : : #include "utils/rel.h"
26 : : #include "utils/timestamp.h"
27 : :
28 : :
29 : : /* Record that's written to 2PC state file when pgstat state is persisted */
30 : : typedef struct TwoPhasePgStatRecord
31 : : {
32 : : PgStat_Counter tuples_inserted; /* tuples inserted in xact */
33 : : PgStat_Counter tuples_updated; /* tuples updated in xact */
34 : : PgStat_Counter tuples_deleted; /* tuples deleted in xact */
35 : : /* tuples i/u/d prior to truncate/drop */
36 : : PgStat_Counter inserted_pre_truncdrop;
37 : : PgStat_Counter updated_pre_truncdrop;
38 : : PgStat_Counter deleted_pre_truncdrop;
39 : : Oid id; /* table's OID */
40 : : bool shared; /* is it a shared catalog? */
41 : : bool truncdropped; /* was the relation truncated/dropped? */
42 : : } TwoPhasePgStatRecord;
43 : :
44 : :
45 : : static PgStat_TableStatus *pgstat_prep_relation_pending(Oid rel_id, bool isshared);
46 : : static void add_tabstat_xact_level(PgStat_TableStatus *pgstat_info, int nest_level);
47 : : static void ensure_tabstat_xact_level(PgStat_TableStatus *pgstat_info);
48 : : static void save_truncdrop_counters(PgStat_TableXactStatus *trans, bool is_drop);
49 : : static void restore_truncdrop_counters(PgStat_TableXactStatus *trans);
50 : :
51 : :
52 : : /*
53 : : * Copy stats between relations. This is used for things like REINDEX
54 : : * CONCURRENTLY.
55 : : */
56 : : void
57 : 48 : pgstat_copy_relation_stats(Relation dst, Relation src)
58 : : {
59 : 48 : PgStat_StatTabEntry *srcstats;
60 : 48 : PgStatShared_Relation *dstshstats;
61 : 48 : PgStat_EntryRef *dst_ref;
62 : :
63 : 96 : srcstats = pgstat_fetch_stat_tabentry_ext(src->rd_rel->relisshared,
64 : 48 : RelationGetRelid(src));
65 [ + + ]: 48 : if (!srcstats)
66 : 36 : return;
67 : :
68 : 12 : dst_ref = pgstat_get_entry_ref_locked(PGSTAT_KIND_RELATION,
69 [ - + ]: 12 : dst->rd_rel->relisshared ? InvalidOid : MyDatabaseId,
70 : 12 : RelationGetRelid(dst),
71 : : false);
72 : :
73 : 12 : dstshstats = (PgStatShared_Relation *) dst_ref->shared_stats;
74 : 12 : dstshstats->stats = *srcstats;
75 : :
76 : 12 : pgstat_unlock_entry(dst_ref);
77 [ - + ]: 48 : }
78 : :
79 : : /*
80 : : * Initialize a relcache entry to count access statistics. Called whenever a
81 : : * relation is opened.
82 : : *
83 : : * We assume that a relcache entry's pgstat_info field is zeroed by relcache.c
84 : : * when the relcache entry is made; thereafter it is long-lived data.
85 : : *
86 : : * This does not create a reference to a stats entry in shared memory, nor
87 : : * allocate memory for the pending stats. That happens in
88 : : * pgstat_assoc_relation().
89 : : */
90 : : void
91 : 3603690 : pgstat_init_relation(Relation rel)
92 : : {
93 : 3603690 : char relkind = rel->rd_rel->relkind;
94 : :
95 : : /*
96 : : * We only count stats for relations with storage and partitioned tables
97 : : */
98 [ + + + + : 3603690 : if (!RELKIND_HAS_STORAGE(relkind) && relkind != RELKIND_PARTITIONED_TABLE)
+ + + + +
+ + + ]
99 : : {
100 : 11416 : rel->pgstat_enabled = false;
101 : 11416 : rel->pgstat_info = NULL;
102 : 11416 : return;
103 : : }
104 : :
105 [ + - ]: 3592274 : if (!pgstat_track_counts)
106 : : {
107 [ # # ]: 0 : if (rel->pgstat_info)
108 : 0 : pgstat_unlink_relation(rel);
109 : :
110 : : /* We're not counting at all */
111 : 0 : rel->pgstat_enabled = false;
112 : 0 : rel->pgstat_info = NULL;
113 : 0 : return;
114 : : }
115 : :
116 : 3592274 : rel->pgstat_enabled = true;
117 [ - + ]: 3603690 : }
118 : :
119 : : /*
120 : : * Prepare for statistics for this relation to be collected.
121 : : *
122 : : * This ensures we have a reference to the stats entry before stats can be
123 : : * generated. That is important because a relation drop in another connection
124 : : * could otherwise lead to the stats entry being dropped, which then later
125 : : * would get recreated when flushing stats.
126 : : *
127 : : * This is separate from pgstat_init_relation() as it is not uncommon for
128 : : * relcache entries to be opened without ever getting stats reported.
129 : : */
130 : : void
131 : 64282 : pgstat_assoc_relation(Relation rel)
132 : : {
133 [ + - ]: 64282 : Assert(rel->pgstat_enabled);
134 [ + - ]: 64282 : Assert(rel->pgstat_info == NULL);
135 : :
136 : : /* Else find or make the PgStat_TableStatus entry, and update link */
137 : 128564 : rel->pgstat_info = pgstat_prep_relation_pending(RelationGetRelid(rel),
138 : 64282 : rel->rd_rel->relisshared);
139 : :
140 : : /* don't allow link a stats to multiple relcache entries */
141 [ + - ]: 64282 : Assert(rel->pgstat_info->relation == NULL);
142 : :
143 : : /* mark this relation as the owner */
144 : 64282 : rel->pgstat_info->relation = rel;
145 : 64282 : }
146 : :
147 : : /*
148 : : * Break the mutual link between a relcache entry and pending stats entry.
149 : : * This must be called whenever one end of the link is removed.
150 : : */
151 : : void
152 : 178698 : pgstat_unlink_relation(Relation rel)
153 : : {
154 : : /* remove the link to stats info if any */
155 [ + + ]: 178698 : if (rel->pgstat_info == NULL)
156 : 114416 : return;
157 : :
158 : : /* link sanity check */
159 [ + - ]: 64282 : Assert(rel->pgstat_info->relation == rel);
160 : 64282 : rel->pgstat_info->relation = NULL;
161 : 64282 : rel->pgstat_info = NULL;
162 : 178698 : }
163 : :
164 : : /*
165 : : * Ensure that stats are dropped if transaction aborts.
166 : : */
167 : : void
168 : 11063 : pgstat_create_relation(Relation rel)
169 : : {
170 : 11063 : pgstat_create_transactional(PGSTAT_KIND_RELATION,
171 [ + + ]: 11063 : rel->rd_rel->relisshared ? InvalidOid : MyDatabaseId,
172 : 11063 : RelationGetRelid(rel));
173 : 11063 : }
174 : :
175 : : /*
176 : : * Ensure that stats are dropped if transaction commits.
177 : : */
178 : : void
179 : 8296 : pgstat_drop_relation(Relation rel)
180 : : {
181 : 8296 : int nest_level = GetCurrentTransactionNestLevel();
182 : 8296 : PgStat_TableStatus *pgstat_info;
183 : :
184 : 8296 : pgstat_drop_transactional(PGSTAT_KIND_RELATION,
185 [ - + ]: 8296 : rel->rd_rel->relisshared ? InvalidOid : MyDatabaseId,
186 : 8296 : RelationGetRelid(rel));
187 : :
188 [ + + + + : 8296 : if (!pgstat_should_count_relation(rel))
+ + ]
189 : 699 : return;
190 : :
191 : : /*
192 : : * Transactionally set counters to 0. That ensures that accesses to
193 : : * pg_stat_xact_all_tables inside the transaction show 0.
194 : : */
195 : 7597 : pgstat_info = rel->pgstat_info;
196 [ + + + + ]: 7597 : if (pgstat_info->trans &&
197 : 184 : pgstat_info->trans->nest_level == nest_level)
198 : : {
199 : 183 : save_truncdrop_counters(pgstat_info->trans, true);
200 : 183 : pgstat_info->trans->tuples_inserted = 0;
201 : 183 : pgstat_info->trans->tuples_updated = 0;
202 : 183 : pgstat_info->trans->tuples_deleted = 0;
203 : 183 : }
204 [ - + ]: 8296 : }
205 : :
206 : : /*
207 : : * Report that the table was just vacuumed and flush IO statistics.
208 : : */
209 : : void
210 : 645 : pgstat_report_vacuum(Relation rel, PgStat_Counter livetuples,
211 : : PgStat_Counter deadtuples, TimestampTz starttime)
212 : : {
213 : 645 : PgStat_EntryRef *entry_ref;
214 : 645 : PgStatShared_Relation *shtabentry;
215 : 645 : PgStat_StatTabEntry *tabentry;
216 [ + + ]: 645 : Oid dboid = (rel->rd_rel->relisshared ? InvalidOid : MyDatabaseId);
217 : 645 : TimestampTz ts;
218 : 645 : PgStat_Counter elapsedtime;
219 : :
220 [ + - ]: 645 : if (!pgstat_track_counts)
221 : 0 : return;
222 : :
223 : : /* Store the data in the table's hash table entry. */
224 : 645 : ts = GetCurrentTimestamp();
225 : 645 : elapsedtime = TimestampDifferenceMilliseconds(starttime, ts);
226 : :
227 : : /* block acquiring lock for the same reason as pgstat_report_autovac() */
228 : 1290 : entry_ref = pgstat_get_entry_ref_locked(PGSTAT_KIND_RELATION, dboid,
229 : 645 : RelationGetRelid(rel), false);
230 : :
231 : 645 : shtabentry = (PgStatShared_Relation *) entry_ref->shared_stats;
232 : 645 : tabentry = &shtabentry->stats;
233 : :
234 : 645 : tabentry->live_tuples = livetuples;
235 : 645 : tabentry->dead_tuples = deadtuples;
236 : :
237 : : /*
238 : : * It is quite possible that a non-aggressive VACUUM ended up skipping
239 : : * various pages, however, we'll zero the insert counter here regardless.
240 : : * It's currently used only to track when we need to perform an "insert"
241 : : * autovacuum, which are mainly intended to freeze newly inserted tuples.
242 : : * Zeroing this may just mean we'll not try to vacuum the table again
243 : : * until enough tuples have been inserted to trigger another insert
244 : : * autovacuum. An anti-wraparound autovacuum will catch any persistent
245 : : * stragglers.
246 : : */
247 : 645 : tabentry->ins_since_vacuum = 0;
248 : :
249 [ - + ]: 645 : if (AmAutoVacuumWorkerProcess())
250 : : {
251 : 0 : tabentry->last_autovacuum_time = ts;
252 : 0 : tabentry->autovacuum_count++;
253 : 0 : tabentry->total_autovacuum_time += elapsedtime;
254 : 0 : }
255 : : else
256 : : {
257 : 645 : tabentry->last_vacuum_time = ts;
258 : 645 : tabentry->vacuum_count++;
259 : 645 : tabentry->total_vacuum_time += elapsedtime;
260 : : }
261 : :
262 : 645 : pgstat_unlock_entry(entry_ref);
263 : :
264 : : /*
265 : : * Flush IO statistics now. pgstat_report_stat() will flush IO stats,
266 : : * however this will not be called until after an entire autovacuum cycle
267 : : * is done -- which will likely vacuum many relations -- or until the
268 : : * VACUUM command has processed all tables and committed.
269 : : */
270 : 645 : pgstat_flush_io(false);
271 : 645 : (void) pgstat_flush_backend(false, PGSTAT_BACKEND_FLUSH_IO);
272 [ - + ]: 645 : }
273 : :
274 : : /*
275 : : * Report that the table was just analyzed and flush IO statistics.
276 : : *
277 : : * Caller must provide new live- and dead-tuples estimates, as well as a
278 : : * flag indicating whether to reset the mod_since_analyze counter.
279 : : */
280 : : void
281 : 775 : pgstat_report_analyze(Relation rel,
282 : : PgStat_Counter livetuples, PgStat_Counter deadtuples,
283 : : bool resetcounter, TimestampTz starttime)
284 : : {
285 : 775 : PgStat_EntryRef *entry_ref;
286 : 775 : PgStatShared_Relation *shtabentry;
287 : 775 : PgStat_StatTabEntry *tabentry;
288 [ + + ]: 775 : Oid dboid = (rel->rd_rel->relisshared ? InvalidOid : MyDatabaseId);
289 : 775 : TimestampTz ts;
290 : 775 : PgStat_Counter elapsedtime;
291 : :
292 [ + - ]: 775 : if (!pgstat_track_counts)
293 : 0 : return;
294 : :
295 : : /*
296 : : * Unlike VACUUM, ANALYZE might be running inside a transaction that has
297 : : * already inserted and/or deleted rows in the target table. ANALYZE will
298 : : * have counted such rows as live or dead respectively. Because we will
299 : : * report our counts of such rows at transaction end, we should subtract
300 : : * off these counts from the update we're making now, else they'll be
301 : : * double-counted after commit. (This approach also ensures that the
302 : : * shared stats entry ends up with the right numbers if we abort instead
303 : : * of committing.)
304 : : *
305 : : * Waste no time on partitioned tables, though.
306 : : */
307 [ + + + + : 775 : if (pgstat_should_count_relation(rel) &&
+ - ]
308 : 652 : rel->rd_rel->relkind != RELKIND_PARTITIONED_TABLE)
309 : : {
310 : 652 : PgStat_TableXactStatus *trans;
311 : :
312 [ + + ]: 674 : for (trans = rel->pgstat_info->trans; trans; trans = trans->upper)
313 : : {
314 : 22 : livetuples -= trans->tuples_inserted - trans->tuples_deleted;
315 : 22 : deadtuples -= trans->tuples_updated + trans->tuples_deleted;
316 : 22 : }
317 : : /* count stuff inserted by already-aborted subxacts, too */
318 : 652 : deadtuples -= rel->pgstat_info->counts.delta_dead_tuples;
319 : : /* Since ANALYZE's counts are estimates, we could have underflowed */
320 [ + + ]: 652 : livetuples = Max(livetuples, 0);
321 [ + + ]: 652 : deadtuples = Max(deadtuples, 0);
322 : 652 : }
323 : :
324 : : /* Store the data in the table's hash table entry. */
325 : 775 : ts = GetCurrentTimestamp();
326 : 775 : elapsedtime = TimestampDifferenceMilliseconds(starttime, ts);
327 : :
328 : : /* block acquiring lock for the same reason as pgstat_report_autovac() */
329 : 1550 : entry_ref = pgstat_get_entry_ref_locked(PGSTAT_KIND_RELATION, dboid,
330 : 775 : RelationGetRelid(rel),
331 : : false);
332 : : /* can't get dropped while accessed */
333 [ + - ]: 775 : Assert(entry_ref != NULL && entry_ref->shared_stats != NULL);
334 : :
335 : 775 : shtabentry = (PgStatShared_Relation *) entry_ref->shared_stats;
336 : 775 : tabentry = &shtabentry->stats;
337 : :
338 : 775 : tabentry->live_tuples = livetuples;
339 : 775 : tabentry->dead_tuples = deadtuples;
340 : :
341 : : /*
342 : : * If commanded, reset mod_since_analyze to zero. This forgets any
343 : : * changes that were committed while the ANALYZE was in progress, but we
344 : : * have no good way to estimate how many of those there were.
345 : : */
346 [ + + ]: 775 : if (resetcounter)
347 : 768 : tabentry->mod_since_analyze = 0;
348 : :
349 [ - + ]: 775 : if (AmAutoVacuumWorkerProcess())
350 : : {
351 : 0 : tabentry->last_autoanalyze_time = ts;
352 : 0 : tabentry->autoanalyze_count++;
353 : 0 : tabentry->total_autoanalyze_time += elapsedtime;
354 : 0 : }
355 : : else
356 : : {
357 : 775 : tabentry->last_analyze_time = ts;
358 : 775 : tabentry->analyze_count++;
359 : 775 : tabentry->total_analyze_time += elapsedtime;
360 : : }
361 : :
362 : 775 : pgstat_unlock_entry(entry_ref);
363 : :
364 : : /* see pgstat_report_vacuum() */
365 : 775 : pgstat_flush_io(false);
366 : 775 : (void) pgstat_flush_backend(false, PGSTAT_BACKEND_FLUSH_IO);
367 [ - + ]: 775 : }
368 : :
369 : : /*
370 : : * count a tuple insertion of n tuples
371 : : */
372 : : void
373 : 1740399 : pgstat_count_heap_insert(Relation rel, PgStat_Counter n)
374 : : {
375 [ + + + + : 1740399 : if (pgstat_should_count_relation(rel))
+ + ]
376 : : {
377 : 1736617 : PgStat_TableStatus *pgstat_info = rel->pgstat_info;
378 : :
379 : 1736617 : ensure_tabstat_xact_level(pgstat_info);
380 : 1736617 : pgstat_info->trans->tuples_inserted += n;
381 : 1736617 : }
382 : 1740399 : }
383 : :
384 : : /*
385 : : * count a tuple update
386 : : */
387 : : void
388 : 24110 : pgstat_count_heap_update(Relation rel, bool hot, bool newpage)
389 : : {
390 [ + + + - ]: 24110 : Assert(!(hot && newpage));
391 : :
392 [ + - + - : 24110 : if (pgstat_should_count_relation(rel))
# # ]
393 : : {
394 : 24110 : PgStat_TableStatus *pgstat_info = rel->pgstat_info;
395 : :
396 : 24110 : ensure_tabstat_xact_level(pgstat_info);
397 : 24110 : pgstat_info->trans->tuples_updated++;
398 : :
399 : : /*
400 : : * tuples_hot_updated and tuples_newpage_updated counters are
401 : : * nontransactional, so just advance them
402 : : */
403 [ + + ]: 24110 : if (hot)
404 : 14631 : pgstat_info->counts.tuples_hot_updated++;
405 [ + + ]: 9479 : else if (newpage)
406 : 6576 : pgstat_info->counts.tuples_newpage_updated++;
407 : 24110 : }
408 : 24110 : }
409 : :
410 : : /*
411 : : * count a tuple deletion
412 : : */
413 : : void
414 : 303820 : pgstat_count_heap_delete(Relation rel)
415 : : {
416 [ + - + - : 303820 : if (pgstat_should_count_relation(rel))
# # ]
417 : : {
418 : 303820 : PgStat_TableStatus *pgstat_info = rel->pgstat_info;
419 : :
420 : 303820 : ensure_tabstat_xact_level(pgstat_info);
421 : 303820 : pgstat_info->trans->tuples_deleted++;
422 : 303820 : }
423 : 303820 : }
424 : :
425 : : /*
426 : : * update tuple counters due to truncate
427 : : */
428 : : void
429 : 460 : pgstat_count_truncate(Relation rel)
430 : : {
431 [ + + + - : 460 : if (pgstat_should_count_relation(rel))
+ - ]
432 : : {
433 : 460 : PgStat_TableStatus *pgstat_info = rel->pgstat_info;
434 : :
435 : 460 : ensure_tabstat_xact_level(pgstat_info);
436 : 460 : save_truncdrop_counters(pgstat_info->trans, false);
437 : 460 : pgstat_info->trans->tuples_inserted = 0;
438 : 460 : pgstat_info->trans->tuples_updated = 0;
439 : 460 : pgstat_info->trans->tuples_deleted = 0;
440 : 460 : }
441 : 460 : }
442 : :
443 : : /*
444 : : * update dead-tuples count
445 : : *
446 : : * The semantics of this are that we are reporting the nontransactional
447 : : * recovery of "delta" dead tuples; so delta_dead_tuples decreases
448 : : * rather than increasing, and the change goes straight into the per-table
449 : : * counter, not into transactional state.
450 : : */
451 : : void
452 : 2210 : pgstat_update_heap_dead_tuples(Relation rel, int delta)
453 : : {
454 [ + - + - : 2210 : if (pgstat_should_count_relation(rel))
# # ]
455 : : {
456 : 2210 : PgStat_TableStatus *pgstat_info = rel->pgstat_info;
457 : :
458 : 2210 : pgstat_info->counts.delta_dead_tuples -= delta;
459 : 2210 : }
460 : 2210 : }
461 : :
462 : : /*
463 : : * Support function for the SQL-callable pgstat* functions. Returns
464 : : * the collected statistics for one table or NULL. NULL doesn't mean
465 : : * that the table doesn't exist, just that there are no statistics, so the
466 : : * caller is better off to report ZERO instead.
467 : : */
468 : : PgStat_StatTabEntry *
469 : 1580 : pgstat_fetch_stat_tabentry(Oid relid)
470 : : {
471 : 1580 : return pgstat_fetch_stat_tabentry_ext(IsSharedRelation(relid), relid);
472 : : }
473 : :
474 : : /*
475 : : * More efficient version of pgstat_fetch_stat_tabentry(), allowing to specify
476 : : * whether the to-be-accessed table is a shared relation or not.
477 : : */
478 : : PgStat_StatTabEntry *
479 : 1749 : pgstat_fetch_stat_tabentry_ext(bool shared, Oid reloid)
480 : : {
481 [ + + ]: 1749 : Oid dboid = (shared ? InvalidOid : MyDatabaseId);
482 : :
483 : 1749 : return (PgStat_StatTabEntry *)
484 : 1749 : pgstat_fetch_entry(PGSTAT_KIND_RELATION, dboid, reloid);
485 : 1749 : }
486 : :
487 : : /*
488 : : * find any existing PgStat_TableStatus entry for rel
489 : : *
490 : : * Find any existing PgStat_TableStatus entry for rel_id in the current
491 : : * database. If not found, try finding from shared tables.
492 : : *
493 : : * If an entry is found, copy it and increment the copy's counters with their
494 : : * subtransaction counterparts, then return the copy. The caller may need to
495 : : * pfree() the copy.
496 : : *
497 : : * If no entry found, return NULL, don't create a new one.
498 : : */
499 : : PgStat_TableStatus *
500 : 8 : find_tabstat_entry(Oid rel_id)
501 : : {
502 : 8 : PgStat_EntryRef *entry_ref;
503 : 8 : PgStat_TableXactStatus *trans;
504 : 8 : PgStat_TableStatus *tabentry = NULL;
505 : 8 : PgStat_TableStatus *tablestatus = NULL;
506 : :
507 : 8 : entry_ref = pgstat_fetch_pending_entry(PGSTAT_KIND_RELATION, MyDatabaseId, rel_id);
508 [ + + ]: 8 : if (!entry_ref)
509 : : {
510 : 2 : entry_ref = pgstat_fetch_pending_entry(PGSTAT_KIND_RELATION, InvalidOid, rel_id);
511 [ - + ]: 2 : if (!entry_ref)
512 : 2 : return tablestatus;
513 : 0 : }
514 : :
515 : 6 : tabentry = (PgStat_TableStatus *) entry_ref->pending;
516 : 6 : tablestatus = palloc_object(PgStat_TableStatus);
517 : 6 : *tablestatus = *tabentry;
518 : :
519 : : /*
520 : : * Reset tablestatus->trans in the copy of PgStat_TableStatus as it may
521 : : * point to a shared memory area. Its data is saved below, so removing it
522 : : * does not matter.
523 : : */
524 : 6 : tablestatus->trans = NULL;
525 : :
526 : : /*
527 : : * Live subtransaction counts are not included yet. This is not a hot
528 : : * code path so reconcile tuples_inserted, tuples_updated and
529 : : * tuples_deleted even if the caller may not be interested in this data.
530 : : */
531 [ + + ]: 14 : for (trans = tabentry->trans; trans != NULL; trans = trans->upper)
532 : : {
533 : 8 : tablestatus->counts.tuples_inserted += trans->tuples_inserted;
534 : 8 : tablestatus->counts.tuples_updated += trans->tuples_updated;
535 : 8 : tablestatus->counts.tuples_deleted += trans->tuples_deleted;
536 : 8 : }
537 : :
538 : 6 : return tablestatus;
539 : 8 : }
540 : :
541 : : /*
542 : : * Perform relation stats specific end-of-transaction work. Helper for
543 : : * AtEOXact_PgStat.
544 : : *
545 : : * Transfer transactional insert/update counts into the base tabstat entries.
546 : : * We don't bother to free any of the transactional state, since it's all in
547 : : * TopTransactionContext and will go away anyway.
548 : : */
549 : : void
550 : 21689 : AtEOXact_PgStat_Relations(PgStat_SubXactStatus *xact_state, bool isCommit)
551 : : {
552 : 21689 : PgStat_TableXactStatus *trans;
553 : :
554 [ + + ]: 90322 : for (trans = xact_state->first; trans != NULL; trans = trans->next)
555 : : {
556 : 68633 : PgStat_TableStatus *tabstat;
557 : :
558 [ + - ]: 68633 : Assert(trans->nest_level == 1);
559 [ - + ]: 68633 : Assert(trans->upper == NULL);
560 : 68633 : tabstat = trans->parent;
561 [ - + ]: 68633 : Assert(tabstat->trans == trans);
562 : : /* restore pre-truncate/drop stats (if any) in case of aborted xact */
563 [ + + ]: 68633 : if (!isCommit)
564 : 3428 : restore_truncdrop_counters(trans);
565 : : /* count attempted actions regardless of commit/abort */
566 : 68633 : tabstat->counts.tuples_inserted += trans->tuples_inserted;
567 : 68633 : tabstat->counts.tuples_updated += trans->tuples_updated;
568 : 68633 : tabstat->counts.tuples_deleted += trans->tuples_deleted;
569 [ + + ]: 68633 : if (isCommit)
570 : : {
571 : 65205 : tabstat->counts.truncdropped = trans->truncdropped;
572 [ + + ]: 65205 : if (trans->truncdropped)
573 : : {
574 : : /* forget live/dead stats seen by backend thus far */
575 : 586 : tabstat->counts.delta_live_tuples = 0;
576 : 586 : tabstat->counts.delta_dead_tuples = 0;
577 : 586 : }
578 : : /* insert adds a live tuple, delete removes one */
579 : 65205 : tabstat->counts.delta_live_tuples +=
580 : 65205 : trans->tuples_inserted - trans->tuples_deleted;
581 : : /* update and delete each create a dead tuple */
582 : 65205 : tabstat->counts.delta_dead_tuples +=
583 : 65205 : trans->tuples_updated + trans->tuples_deleted;
584 : : /* insert, update, delete each count as one change event */
585 : 65205 : tabstat->counts.changed_tuples +=
586 : 130410 : trans->tuples_inserted + trans->tuples_updated +
587 : 65205 : trans->tuples_deleted;
588 : 65205 : }
589 : : else
590 : : {
591 : : /* inserted tuples are dead, deleted tuples are unaffected */
592 : 3428 : tabstat->counts.delta_dead_tuples +=
593 : 3428 : trans->tuples_inserted + trans->tuples_updated;
594 : : /* an aborted xact generates no changed_tuple events */
595 : : }
596 : 68633 : tabstat->trans = NULL;
597 : 68633 : }
598 : 21689 : }
599 : :
600 : : /*
601 : : * Perform relation stats specific end-of-sub-transaction work. Helper for
602 : : * AtEOSubXact_PgStat.
603 : : *
604 : : * Transfer transactional insert/update counts into the next higher
605 : : * subtransaction state.
606 : : */
607 : : void
608 : 200 : AtEOSubXact_PgStat_Relations(PgStat_SubXactStatus *xact_state, bool isCommit, int nestDepth)
609 : : {
610 : 200 : PgStat_TableXactStatus *trans;
611 : 200 : PgStat_TableXactStatus *next_trans;
612 : :
613 [ + + ]: 513 : for (trans = xact_state->first; trans != NULL; trans = next_trans)
614 : : {
615 : 313 : PgStat_TableStatus *tabstat;
616 : :
617 : 313 : next_trans = trans->next;
618 [ + - ]: 313 : Assert(trans->nest_level == nestDepth);
619 : 313 : tabstat = trans->parent;
620 [ + - ]: 313 : Assert(tabstat->trans == trans);
621 : :
622 [ + + ]: 313 : if (isCommit)
623 : : {
624 [ + + + + ]: 79 : if (trans->upper && trans->upper->nest_level == nestDepth - 1)
625 : : {
626 [ + + ]: 23 : if (trans->truncdropped)
627 : : {
628 : : /* propagate the truncate/drop status one level up */
629 : 4 : save_truncdrop_counters(trans->upper, false);
630 : : /* replace upper xact stats with ours */
631 : 4 : trans->upper->tuples_inserted = trans->tuples_inserted;
632 : 4 : trans->upper->tuples_updated = trans->tuples_updated;
633 : 4 : trans->upper->tuples_deleted = trans->tuples_deleted;
634 : 4 : }
635 : : else
636 : : {
637 : 19 : trans->upper->tuples_inserted += trans->tuples_inserted;
638 : 19 : trans->upper->tuples_updated += trans->tuples_updated;
639 : 19 : trans->upper->tuples_deleted += trans->tuples_deleted;
640 : : }
641 : 23 : tabstat->trans = trans->upper;
642 : 23 : pfree(trans);
643 : 23 : }
644 : : else
645 : : {
646 : : /*
647 : : * When there isn't an immediate parent state, we can just
648 : : * reuse the record instead of going through a palloc/pfree
649 : : * pushup (this works since it's all in TopTransactionContext
650 : : * anyway). We have to re-link it into the parent level,
651 : : * though, and that might mean pushing a new entry into the
652 : : * pgStatXactStack.
653 : : */
654 : 56 : PgStat_SubXactStatus *upper_xact_state;
655 : :
656 : 56 : upper_xact_state = pgstat_get_xact_stack_level(nestDepth - 1);
657 : 56 : trans->next = upper_xact_state->first;
658 : 56 : upper_xact_state->first = trans;
659 : 56 : trans->nest_level = nestDepth - 1;
660 : 56 : }
661 : 79 : }
662 : : else
663 : : {
664 : : /*
665 : : * On abort, update top-level tabstat counts, then forget the
666 : : * subtransaction
667 : : */
668 : :
669 : : /* first restore values obliterated by truncate/drop */
670 : 234 : restore_truncdrop_counters(trans);
671 : : /* count attempted actions regardless of commit/abort */
672 : 234 : tabstat->counts.tuples_inserted += trans->tuples_inserted;
673 : 234 : tabstat->counts.tuples_updated += trans->tuples_updated;
674 : 234 : tabstat->counts.tuples_deleted += trans->tuples_deleted;
675 : : /* inserted tuples are dead, deleted tuples are unaffected */
676 : 234 : tabstat->counts.delta_dead_tuples +=
677 : 234 : trans->tuples_inserted + trans->tuples_updated;
678 : 234 : tabstat->trans = trans->upper;
679 : 234 : pfree(trans);
680 : : }
681 : 313 : }
682 : 200 : }
683 : :
684 : : /*
685 : : * Generate 2PC records for all the pending transaction-dependent relation
686 : : * stats.
687 : : */
688 : : void
689 : 0 : AtPrepare_PgStat_Relations(PgStat_SubXactStatus *xact_state)
690 : : {
691 : 0 : PgStat_TableXactStatus *trans;
692 : :
693 [ # # ]: 0 : for (trans = xact_state->first; trans != NULL; trans = trans->next)
694 : : {
695 : 0 : PgStat_TableStatus *tabstat PG_USED_FOR_ASSERTS_ONLY;
696 : 0 : TwoPhasePgStatRecord record;
697 : :
698 [ # # ]: 0 : Assert(trans->nest_level == 1);
699 [ # # ]: 0 : Assert(trans->upper == NULL);
700 : 0 : tabstat = trans->parent;
701 [ # # ]: 0 : Assert(tabstat->trans == trans);
702 : :
703 : 0 : record.tuples_inserted = trans->tuples_inserted;
704 : 0 : record.tuples_updated = trans->tuples_updated;
705 : 0 : record.tuples_deleted = trans->tuples_deleted;
706 : 0 : record.inserted_pre_truncdrop = trans->inserted_pre_truncdrop;
707 : 0 : record.updated_pre_truncdrop = trans->updated_pre_truncdrop;
708 : 0 : record.deleted_pre_truncdrop = trans->deleted_pre_truncdrop;
709 : 0 : record.id = tabstat->id;
710 : 0 : record.shared = tabstat->shared;
711 : 0 : record.truncdropped = trans->truncdropped;
712 : :
713 : 0 : RegisterTwoPhaseRecord(TWOPHASE_RM_PGSTAT_ID, 0,
714 : : &record, sizeof(TwoPhasePgStatRecord));
715 : 0 : }
716 : 0 : }
717 : :
718 : : /*
719 : : * All we need do here is unlink the transaction stats state from the
720 : : * nontransactional state. The nontransactional action counts will be
721 : : * reported to the stats system immediately, while the effects on live and
722 : : * dead tuple counts are preserved in the 2PC state file.
723 : : *
724 : : * Note: AtEOXact_PgStat_Relations is not called during PREPARE.
725 : : */
726 : : void
727 : 0 : PostPrepare_PgStat_Relations(PgStat_SubXactStatus *xact_state)
728 : : {
729 : 0 : PgStat_TableXactStatus *trans;
730 : :
731 [ # # ]: 0 : for (trans = xact_state->first; trans != NULL; trans = trans->next)
732 : : {
733 : 0 : PgStat_TableStatus *tabstat;
734 : :
735 : 0 : tabstat = trans->parent;
736 : 0 : tabstat->trans = NULL;
737 : 0 : }
738 : 0 : }
739 : :
740 : : /*
741 : : * 2PC processing routine for COMMIT PREPARED case.
742 : : *
743 : : * Load the saved counts into our local pgstats state.
744 : : */
745 : : void
746 : 0 : pgstat_twophase_postcommit(FullTransactionId fxid, uint16 info,
747 : : void *recdata, uint32 len)
748 : : {
749 : 0 : TwoPhasePgStatRecord *rec = (TwoPhasePgStatRecord *) recdata;
750 : 0 : PgStat_TableStatus *pgstat_info;
751 : :
752 : : /* Find or create a tabstat entry for the rel */
753 : 0 : pgstat_info = pgstat_prep_relation_pending(rec->id, rec->shared);
754 : :
755 : : /* Same math as in AtEOXact_PgStat, commit case */
756 : 0 : pgstat_info->counts.tuples_inserted += rec->tuples_inserted;
757 : 0 : pgstat_info->counts.tuples_updated += rec->tuples_updated;
758 : 0 : pgstat_info->counts.tuples_deleted += rec->tuples_deleted;
759 : 0 : pgstat_info->counts.truncdropped = rec->truncdropped;
760 [ # # ]: 0 : if (rec->truncdropped)
761 : : {
762 : : /* forget live/dead stats seen by backend thus far */
763 : 0 : pgstat_info->counts.delta_live_tuples = 0;
764 : 0 : pgstat_info->counts.delta_dead_tuples = 0;
765 : 0 : }
766 : 0 : pgstat_info->counts.delta_live_tuples +=
767 : 0 : rec->tuples_inserted - rec->tuples_deleted;
768 : 0 : pgstat_info->counts.delta_dead_tuples +=
769 : 0 : rec->tuples_updated + rec->tuples_deleted;
770 : 0 : pgstat_info->counts.changed_tuples +=
771 : 0 : rec->tuples_inserted + rec->tuples_updated +
772 : 0 : rec->tuples_deleted;
773 : 0 : }
774 : :
775 : : /*
776 : : * 2PC processing routine for ROLLBACK PREPARED case.
777 : : *
778 : : * Load the saved counts into our local pgstats state, but treat them
779 : : * as aborted.
780 : : */
781 : : void
782 : 0 : pgstat_twophase_postabort(FullTransactionId fxid, uint16 info,
783 : : void *recdata, uint32 len)
784 : : {
785 : 0 : TwoPhasePgStatRecord *rec = (TwoPhasePgStatRecord *) recdata;
786 : 0 : PgStat_TableStatus *pgstat_info;
787 : :
788 : : /* Find or create a tabstat entry for the rel */
789 : 0 : pgstat_info = pgstat_prep_relation_pending(rec->id, rec->shared);
790 : :
791 : : /* Same math as in AtEOXact_PgStat, abort case */
792 [ # # ]: 0 : if (rec->truncdropped)
793 : : {
794 : 0 : rec->tuples_inserted = rec->inserted_pre_truncdrop;
795 : 0 : rec->tuples_updated = rec->updated_pre_truncdrop;
796 : 0 : rec->tuples_deleted = rec->deleted_pre_truncdrop;
797 : 0 : }
798 : 0 : pgstat_info->counts.tuples_inserted += rec->tuples_inserted;
799 : 0 : pgstat_info->counts.tuples_updated += rec->tuples_updated;
800 : 0 : pgstat_info->counts.tuples_deleted += rec->tuples_deleted;
801 : 0 : pgstat_info->counts.delta_dead_tuples +=
802 : 0 : rec->tuples_inserted + rec->tuples_updated;
803 : 0 : }
804 : :
805 : : /*
806 : : * Flush out pending stats for the entry
807 : : *
808 : : * If nowait is true and the lock could not be immediately acquired, returns
809 : : * false without flushing the entry. Otherwise returns true.
810 : : *
811 : : * Some of the stats are copied to the corresponding pending database stats
812 : : * entry when successfully flushing.
813 : : */
814 : : bool
815 : 44882 : pgstat_relation_flush_cb(PgStat_EntryRef *entry_ref, bool nowait)
816 : : {
817 : 44882 : Oid dboid;
818 : 44882 : PgStat_TableStatus *lstats; /* pending stats entry */
819 : 44882 : PgStatShared_Relation *shtabstats;
820 : 44882 : PgStat_StatTabEntry *tabentry; /* table entry of shared stats */
821 : 44882 : PgStat_StatDBEntry *dbentry; /* pending database entry */
822 : :
823 : 44882 : dboid = entry_ref->shared_entry->key.dboid;
824 : 44882 : lstats = (PgStat_TableStatus *) entry_ref->pending;
825 : 44882 : shtabstats = (PgStatShared_Relation *) entry_ref->shared_stats;
826 : :
827 : : /*
828 : : * Ignore entries that didn't accumulate any actual counts, such as
829 : : * indexes that were opened by the planner but not used.
830 : : */
831 [ + + ]: 44882 : if (pg_memory_is_all_zeros(&lstats->counts,
832 : : sizeof(struct PgStat_TableCounts)))
833 : 84 : return true;
834 : :
835 [ + - ]: 44798 : if (!pgstat_lock_entry(entry_ref, nowait))
836 : 0 : return false;
837 : :
838 : : /* add the values to the shared entry. */
839 : 44798 : tabentry = &shtabstats->stats;
840 : :
841 : 44798 : tabentry->numscans += lstats->counts.numscans;
842 [ + + ]: 44798 : if (lstats->counts.numscans)
843 : : {
844 : 28204 : TimestampTz t = GetCurrentTransactionStopTimestamp();
845 : :
846 [ + + ]: 28204 : if (t > tabentry->lastscan)
847 : 27719 : tabentry->lastscan = t;
848 : 28204 : }
849 : 44798 : tabentry->tuples_returned += lstats->counts.tuples_returned;
850 : 44798 : tabentry->tuples_fetched += lstats->counts.tuples_fetched;
851 : 44798 : tabentry->tuples_inserted += lstats->counts.tuples_inserted;
852 : 44798 : tabentry->tuples_updated += lstats->counts.tuples_updated;
853 : 44798 : tabentry->tuples_deleted += lstats->counts.tuples_deleted;
854 : 44798 : tabentry->tuples_hot_updated += lstats->counts.tuples_hot_updated;
855 : 44798 : tabentry->tuples_newpage_updated += lstats->counts.tuples_newpage_updated;
856 : :
857 : : /*
858 : : * If table was truncated/dropped, first reset the live/dead counters.
859 : : */
860 [ + + ]: 44798 : if (lstats->counts.truncdropped)
861 : : {
862 : 33 : tabentry->live_tuples = 0;
863 : 33 : tabentry->dead_tuples = 0;
864 : 33 : tabentry->ins_since_vacuum = 0;
865 : 33 : }
866 : :
867 : 44798 : tabentry->live_tuples += lstats->counts.delta_live_tuples;
868 : 44798 : tabentry->dead_tuples += lstats->counts.delta_dead_tuples;
869 : 44798 : tabentry->mod_since_analyze += lstats->counts.changed_tuples;
870 : :
871 : : /*
872 : : * Using tuples_inserted to update ins_since_vacuum does mean that we'll
873 : : * track aborted inserts too. This isn't ideal, but otherwise probably
874 : : * not worth adding an extra field for. It may just amount to autovacuums
875 : : * triggering for inserts more often than they maybe should, which is
876 : : * probably not going to be common enough to be too concerned about here.
877 : : */
878 : 44798 : tabentry->ins_since_vacuum += lstats->counts.tuples_inserted;
879 : :
880 : 44798 : tabentry->blocks_fetched += lstats->counts.blocks_fetched;
881 : 44798 : tabentry->blocks_hit += lstats->counts.blocks_hit;
882 : :
883 : : /* Clamp live_tuples in case of negative delta_live_tuples */
884 [ + + ]: 44798 : tabentry->live_tuples = Max(tabentry->live_tuples, 0);
885 : : /* Likewise for dead_tuples */
886 [ + + ]: 44798 : tabentry->dead_tuples = Max(tabentry->dead_tuples, 0);
887 : :
888 : 44798 : pgstat_unlock_entry(entry_ref);
889 : :
890 : : /* The entry was successfully flushed, add the same to database stats */
891 : 44798 : dbentry = pgstat_prep_database_pending(dboid);
892 : 44798 : dbentry->tuples_returned += lstats->counts.tuples_returned;
893 : 44798 : dbentry->tuples_fetched += lstats->counts.tuples_fetched;
894 : 44798 : dbentry->tuples_inserted += lstats->counts.tuples_inserted;
895 : 44798 : dbentry->tuples_updated += lstats->counts.tuples_updated;
896 : 44798 : dbentry->tuples_deleted += lstats->counts.tuples_deleted;
897 : 44798 : dbentry->blocks_fetched += lstats->counts.blocks_fetched;
898 : 44798 : dbentry->blocks_hit += lstats->counts.blocks_hit;
899 : :
900 : 44798 : return true;
901 : 44882 : }
902 : :
903 : : void
904 : 52647 : pgstat_relation_delete_pending_cb(PgStat_EntryRef *entry_ref)
905 : : {
906 : 52647 : PgStat_TableStatus *pending = (PgStat_TableStatus *) entry_ref->pending;
907 : :
908 [ + + ]: 52647 : if (pending->relation)
909 : 42377 : pgstat_unlink_relation(pending->relation);
910 : 52647 : }
911 : :
912 : : void
913 : 2919 : pgstat_relation_reset_timestamp_cb(PgStatShared_Common *header, TimestampTz ts)
914 : : {
915 : 2919 : ((PgStatShared_Relation *) header)->stats.stat_reset_time = ts;
916 : 2919 : }
917 : :
918 : : /*
919 : : * Find or create a PgStat_TableStatus entry for rel. New entry is created and
920 : : * initialized if not exists.
921 : : */
922 : : static PgStat_TableStatus *
923 : 64282 : pgstat_prep_relation_pending(Oid rel_id, bool isshared)
924 : : {
925 : 64282 : PgStat_EntryRef *entry_ref;
926 : 64282 : PgStat_TableStatus *pending;
927 : :
928 : 64282 : entry_ref = pgstat_prep_pending_entry(PGSTAT_KIND_RELATION,
929 [ + + ]: 64282 : isshared ? InvalidOid : MyDatabaseId,
930 : 64282 : rel_id, NULL);
931 : 64282 : pending = entry_ref->pending;
932 : 64282 : pending->id = rel_id;
933 : 64282 : pending->shared = isshared;
934 : :
935 : 128564 : return pending;
936 : 64282 : }
937 : :
938 : : /*
939 : : * add a new (sub)transaction state record
940 : : */
941 : : static void
942 : 68890 : add_tabstat_xact_level(PgStat_TableStatus *pgstat_info, int nest_level)
943 : : {
944 : 68890 : PgStat_SubXactStatus *xact_state;
945 : 68890 : PgStat_TableXactStatus *trans;
946 : :
947 : : /*
948 : : * If this is the first rel to be modified at the current nest level, we
949 : : * first have to push a transaction stack entry.
950 : : */
951 : 68890 : xact_state = pgstat_get_xact_stack_level(nest_level);
952 : :
953 : : /* Now make a per-table stack entry */
954 : 68890 : trans = (PgStat_TableXactStatus *)
955 : 68890 : MemoryContextAllocZero(TopTransactionContext,
956 : : sizeof(PgStat_TableXactStatus));
957 : 68890 : trans->nest_level = nest_level;
958 : 68890 : trans->upper = pgstat_info->trans;
959 : 68890 : trans->parent = pgstat_info;
960 : 68890 : trans->next = xact_state->first;
961 : 68890 : xact_state->first = trans;
962 : 68890 : pgstat_info->trans = trans;
963 : 68890 : }
964 : :
965 : : /*
966 : : * Add a new (sub)transaction record if needed.
967 : : */
968 : : static void
969 : 2065007 : ensure_tabstat_xact_level(PgStat_TableStatus *pgstat_info)
970 : : {
971 : 2065007 : int nest_level = GetCurrentTransactionNestLevel();
972 : :
973 [ + + + + ]: 2065007 : if (pgstat_info->trans == NULL ||
974 : 1996326 : pgstat_info->trans->nest_level != nest_level)
975 : 68890 : add_tabstat_xact_level(pgstat_info, nest_level);
976 : 2065007 : }
977 : :
978 : : /*
979 : : * Whenever a table is truncated/dropped, we save its i/u/d counters so that
980 : : * they can be cleared, and if the (sub)xact that executed the truncate/drop
981 : : * later aborts, the counters can be restored to the saved (pre-truncate/drop)
982 : : * values.
983 : : *
984 : : * Note that for truncate we do this on the first truncate in any particular
985 : : * subxact level only.
986 : : */
987 : : static void
988 : 647 : save_truncdrop_counters(PgStat_TableXactStatus *trans, bool is_drop)
989 : : {
990 [ + + + + ]: 647 : if (!trans->truncdropped || is_drop)
991 : : {
992 : 644 : trans->inserted_pre_truncdrop = trans->tuples_inserted;
993 : 644 : trans->updated_pre_truncdrop = trans->tuples_updated;
994 : 644 : trans->deleted_pre_truncdrop = trans->tuples_deleted;
995 : 644 : trans->truncdropped = true;
996 : 644 : }
997 : 647 : }
998 : :
999 : : /*
1000 : : * restore counters when a truncate aborts
1001 : : */
1002 : : static void
1003 : 3662 : restore_truncdrop_counters(PgStat_TableXactStatus *trans)
1004 : : {
1005 [ + + ]: 3662 : if (trans->truncdropped)
1006 : : {
1007 : 52 : trans->tuples_inserted = trans->inserted_pre_truncdrop;
1008 : 52 : trans->tuples_updated = trans->updated_pre_truncdrop;
1009 : 52 : trans->tuples_deleted = trans->deleted_pre_truncdrop;
1010 : 52 : }
1011 : 3662 : }
|