Line data Source code
1 : /*
2 : * contrib/pgstattuple/pgstattuple.c
3 : *
4 : * Copyright (c) 2001,2002 Tatsuo Ishii
5 : *
6 : * Permission to use, copy, modify, and distribute this software and
7 : * its documentation for any purpose, without fee, and without a
8 : * written agreement is hereby granted, provided that the above
9 : * copyright notice and this paragraph and the following two
10 : * paragraphs appear in all copies.
11 : *
12 : * IN NO EVENT SHALL THE AUTHOR BE LIABLE TO ANY PARTY FOR DIRECT,
13 : * INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES, INCLUDING
14 : * LOST PROFITS, ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS
15 : * DOCUMENTATION, EVEN IF THE UNIVERSITY OF CALIFORNIA HAS BEEN ADVISED
16 : * OF THE POSSIBILITY OF SUCH DAMAGE.
17 : *
18 : * THE AUTHOR SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING, BUT NOT
19 : * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20 : * A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS ON AN "AS
21 : * IS" BASIS, AND THE AUTHOR HAS NO OBLIGATIONS TO PROVIDE MAINTENANCE,
22 : * SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
23 : */
24 :
25 : #include "postgres.h"
26 :
27 : #include "access/gist_private.h"
28 : #include "access/hash.h"
29 : #include "access/heapam.h"
30 : #include "access/nbtree.h"
31 : #include "access/relscan.h"
32 : #include "access/tableam.h"
33 : #include "catalog/namespace.h"
34 : #include "catalog/pg_am_d.h"
35 : #include "funcapi.h"
36 : #include "miscadmin.h"
37 : #include "storage/bufmgr.h"
38 : #include "storage/lmgr.h"
39 : #include "utils/builtins.h"
40 : #include "utils/varlena.h"
41 :
PG_MODULE_MAGIC;

/*
 * SQL-callable entry points.  The unsuffixed functions perform their own
 * superuser() check; the _v1_5 variants do not and instead rely on EXECUTE
 * having been revoked from PUBLIC.
 */
PG_FUNCTION_INFO_V1(pgstattuple);
PG_FUNCTION_INFO_V1(pgstattuplebyid);
PG_FUNCTION_INFO_V1(pgstattuple_v1_5);
PG_FUNCTION_INFO_V1(pgstattuplebyid_v1_5);
48 :
49 : /*
50 : * struct pgstattuple_type
51 : *
52 : * tuple_percent, dead_tuple_percent and free_percent are computable,
53 : * so not defined here.
54 : */
55 : typedef struct pgstattuple_type
56 : {
57 : uint64 table_len;
58 : uint64 tuple_count;
59 : uint64 tuple_len;
60 : uint64 dead_tuple_count;
61 : uint64 dead_tuple_len;
62 : uint64 free_space; /* free/reusable space in bytes */
63 : } pgstattuple_type;
64 :
65 : typedef void (*pgstat_page) (pgstattuple_type *, Relation, BlockNumber,
66 : BufferAccessStrategy);
67 :
68 : static Datum build_pgstattuple_type(pgstattuple_type *stat,
69 : FunctionCallInfo fcinfo);
70 : static Datum pgstat_relation(Relation rel, FunctionCallInfo fcinfo);
71 : static Datum pgstat_heap(Relation rel, FunctionCallInfo fcinfo);
72 : static void pgstat_btree_page(pgstattuple_type *stat,
73 : Relation rel, BlockNumber blkno,
74 : BufferAccessStrategy bstrategy);
75 : static void pgstat_hash_page(pgstattuple_type *stat,
76 : Relation rel, BlockNumber blkno,
77 : BufferAccessStrategy bstrategy);
78 : static void pgstat_gist_page(pgstattuple_type *stat,
79 : Relation rel, BlockNumber blkno,
80 : BufferAccessStrategy bstrategy);
81 : static Datum pgstat_index(Relation rel, BlockNumber start,
82 : pgstat_page pagefn, FunctionCallInfo fcinfo);
83 : static void pgstat_index_page(pgstattuple_type *stat, Page page,
84 : OffsetNumber minoff, OffsetNumber maxoff);
85 :
86 : /*
87 : * build_pgstattuple_type -- build a pgstattuple_type tuple
88 : */
89 : static Datum
90 16 : build_pgstattuple_type(pgstattuple_type *stat, FunctionCallInfo fcinfo)
91 : {
92 : #define NCOLUMNS 9
93 : #define NCHARS 314
94 :
95 : HeapTuple tuple;
96 : char *values[NCOLUMNS];
97 : char values_buf[NCOLUMNS][NCHARS];
98 : int i;
99 : double tuple_percent;
100 : double dead_tuple_percent;
101 : double free_percent; /* free/reusable space in % */
102 : TupleDesc tupdesc;
103 : AttInMetadata *attinmeta;
104 :
105 : /* Build a tuple descriptor for our result type */
106 16 : if (get_call_result_type(fcinfo, NULL, &tupdesc) != TYPEFUNC_COMPOSITE)
107 0 : elog(ERROR, "return type must be a row type");
108 :
109 : /*
110 : * Generate attribute metadata needed later to produce tuples from raw C
111 : * strings
112 : */
113 16 : attinmeta = TupleDescGetAttInMetadata(tupdesc);
114 :
115 16 : if (stat->table_len == 0)
116 : {
117 16 : tuple_percent = 0.0;
118 16 : dead_tuple_percent = 0.0;
119 16 : free_percent = 0.0;
120 : }
121 : else
122 : {
123 0 : tuple_percent = 100.0 * stat->tuple_len / stat->table_len;
124 0 : dead_tuple_percent = 100.0 * stat->dead_tuple_len / stat->table_len;
125 0 : free_percent = 100.0 * stat->free_space / stat->table_len;
126 : }
127 :
128 : /*
129 : * Prepare a values array for constructing the tuple. This should be an
130 : * array of C strings which will be processed later by the appropriate
131 : * "in" functions.
132 : */
133 160 : for (i = 0; i < NCOLUMNS; i++)
134 144 : values[i] = values_buf[i];
135 16 : i = 0;
136 16 : snprintf(values[i++], NCHARS, INT64_FORMAT, stat->table_len);
137 16 : snprintf(values[i++], NCHARS, INT64_FORMAT, stat->tuple_count);
138 16 : snprintf(values[i++], NCHARS, INT64_FORMAT, stat->tuple_len);
139 16 : snprintf(values[i++], NCHARS, "%.2f", tuple_percent);
140 16 : snprintf(values[i++], NCHARS, INT64_FORMAT, stat->dead_tuple_count);
141 16 : snprintf(values[i++], NCHARS, INT64_FORMAT, stat->dead_tuple_len);
142 16 : snprintf(values[i++], NCHARS, "%.2f", dead_tuple_percent);
143 16 : snprintf(values[i++], NCHARS, INT64_FORMAT, stat->free_space);
144 16 : snprintf(values[i++], NCHARS, "%.2f", free_percent);
145 :
146 : /* build a tuple */
147 16 : tuple = BuildTupleFromCStrings(attinmeta, values);
148 :
149 : /* make the tuple into a datum */
150 16 : return HeapTupleGetDatum(tuple);
151 : }
152 :
153 : /* ----------
154 : * pgstattuple:
155 : * returns live/dead tuples info
156 : *
157 : * C FUNCTION definition
158 : * pgstattuple(text) returns pgstattuple_type
159 : *
160 : * The superuser() check here must be kept as the library might be upgraded
161 : * without the extension being upgraded, meaning that in pre-1.5 installations
162 : * these functions could be called by any user.
163 : * ----------
164 : */
165 :
166 : Datum
167 0 : pgstattuple(PG_FUNCTION_ARGS)
168 : {
169 0 : text *relname = PG_GETARG_TEXT_PP(0);
170 : RangeVar *relrv;
171 : Relation rel;
172 :
173 0 : if (!superuser())
174 0 : ereport(ERROR,
175 : (errcode(ERRCODE_INSUFFICIENT_PRIVILEGE),
176 : errmsg("must be superuser to use pgstattuple functions")));
177 :
178 : /* open relation */
179 0 : relrv = makeRangeVarFromNameList(textToQualifiedNameList(relname));
180 0 : rel = relation_openrv(relrv, AccessShareLock);
181 :
182 0 : PG_RETURN_DATUM(pgstat_relation(rel, fcinfo));
183 : }
184 :
185 : /*
186 : * As of pgstattuple version 1.5, we no longer need to check if the user
187 : * is a superuser because we REVOKE EXECUTE on the function from PUBLIC.
188 : * Users can then grant access to it based on their policies.
189 : *
190 : * Otherwise identical to pgstattuple (above).
191 : */
192 : Datum
193 18 : pgstattuple_v1_5(PG_FUNCTION_ARGS)
194 : {
195 18 : text *relname = PG_GETARG_TEXT_PP(0);
196 : RangeVar *relrv;
197 : Relation rel;
198 :
199 : /* open relation */
200 18 : relrv = makeRangeVarFromNameList(textToQualifiedNameList(relname));
201 18 : rel = relation_openrv(relrv, AccessShareLock);
202 :
203 18 : PG_RETURN_DATUM(pgstat_relation(rel, fcinfo));
204 : }
205 :
206 : /* Must keep superuser() check, see above. */
207 : Datum
208 0 : pgstattuplebyid(PG_FUNCTION_ARGS)
209 : {
210 0 : Oid relid = PG_GETARG_OID(0);
211 : Relation rel;
212 :
213 0 : if (!superuser())
214 0 : ereport(ERROR,
215 : (errcode(ERRCODE_INSUFFICIENT_PRIVILEGE),
216 : errmsg("must be superuser to use pgstattuple functions")));
217 :
218 : /* open relation */
219 0 : rel = relation_open(relid, AccessShareLock);
220 :
221 0 : PG_RETURN_DATUM(pgstat_relation(rel, fcinfo));
222 : }
223 :
224 : /* Remove superuser() check for 1.5 version, see above */
225 : Datum
226 6 : pgstattuplebyid_v1_5(PG_FUNCTION_ARGS)
227 : {
228 6 : Oid relid = PG_GETARG_OID(0);
229 : Relation rel;
230 :
231 : /* open relation */
232 6 : rel = relation_open(relid, AccessShareLock);
233 :
234 6 : PG_RETURN_DATUM(pgstat_relation(rel, fcinfo));
235 : }
236 :
237 : /*
238 : * pgstat_relation
239 : */
240 : static Datum
241 24 : pgstat_relation(Relation rel, FunctionCallInfo fcinfo)
242 : {
243 : const char *err;
244 :
245 : /*
246 : * Reject attempts to read non-local temporary relations; we would be
247 : * likely to get wrong data since we have no visibility into the owning
248 : * session's local buffers.
249 : */
250 24 : if (RELATION_IS_OTHER_TEMP(rel))
251 0 : ereport(ERROR,
252 : (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
253 : errmsg("cannot access temporary tables of other sessions")));
254 :
255 24 : if (RELKIND_HAS_TABLE_AM(rel->rd_rel->relkind) ||
256 8 : rel->rd_rel->relkind == RELKIND_SEQUENCE)
257 : {
258 16 : return pgstat_heap(rel, fcinfo);
259 : }
260 8 : else if (rel->rd_rel->relkind == RELKIND_INDEX)
261 : {
262 : /* see pgstatindex_impl */
263 0 : if (!rel->rd_index->indisvalid)
264 0 : ereport(ERROR,
265 : (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
266 : errmsg("index \"%s\" is not valid",
267 : RelationGetRelationName(rel))));
268 :
269 0 : switch (rel->rd_rel->relam)
270 : {
271 0 : case BTREE_AM_OID:
272 0 : return pgstat_index(rel, BTREE_METAPAGE + 1,
273 : pgstat_btree_page, fcinfo);
274 0 : case HASH_AM_OID:
275 0 : return pgstat_index(rel, HASH_METAPAGE + 1,
276 : pgstat_hash_page, fcinfo);
277 0 : case GIST_AM_OID:
278 0 : return pgstat_index(rel, GIST_ROOT_BLKNO + 1,
279 : pgstat_gist_page, fcinfo);
280 0 : case GIN_AM_OID:
281 0 : err = "gin index";
282 0 : break;
283 0 : case SPGIST_AM_OID:
284 0 : err = "spgist index";
285 0 : break;
286 0 : case BRIN_AM_OID:
287 0 : err = "brin index";
288 0 : break;
289 0 : default:
290 0 : err = "unknown index";
291 0 : break;
292 : }
293 0 : ereport(ERROR,
294 : (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
295 : errmsg("index \"%s\" (%s) is not supported",
296 : RelationGetRelationName(rel), err)));
297 : }
298 : else
299 : {
300 8 : ereport(ERROR,
301 : (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
302 : errmsg("cannot get tuple-level statistics for relation \"%s\"",
303 : RelationGetRelationName(rel)),
304 : errdetail_relkind_not_supported(rel->rd_rel->relkind)));
305 : }
306 :
307 : return 0; /* should not happen */
308 : }
309 :
310 : /*
311 : * pgstat_heap -- returns live/dead tuples info in a heap
312 : */
313 : static Datum
314 16 : pgstat_heap(Relation rel, FunctionCallInfo fcinfo)
315 : {
316 : TableScanDesc scan;
317 : HeapScanDesc hscan;
318 : HeapTuple tuple;
319 : BlockNumber nblocks;
320 16 : BlockNumber block = 0; /* next block to count free space in */
321 : BlockNumber tupblock;
322 : Buffer buffer;
323 16 : pgstattuple_type stat = {0};
324 : SnapshotData SnapshotDirty;
325 :
326 16 : if (rel->rd_rel->relam != HEAP_TABLE_AM_OID)
327 0 : ereport(ERROR,
328 : (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
329 : errmsg("only heap AM is supported")));
330 :
331 : /* Disable syncscan because we assume we scan from block zero upwards */
332 16 : scan = table_beginscan_strat(rel, SnapshotAny, 0, NULL, true, false);
333 16 : hscan = (HeapScanDesc) scan;
334 :
335 16 : InitDirtySnapshot(SnapshotDirty);
336 :
337 16 : nblocks = hscan->rs_nblocks; /* # blocks to be scanned */
338 :
339 : /* scan the relation */
340 16 : while ((tuple = heap_getnext(scan, ForwardScanDirection)) != NULL)
341 : {
342 0 : CHECK_FOR_INTERRUPTS();
343 :
344 : /* must hold a buffer lock to call HeapTupleSatisfiesVisibility */
345 0 : LockBuffer(hscan->rs_cbuf, BUFFER_LOCK_SHARE);
346 :
347 0 : if (HeapTupleSatisfiesVisibility(tuple, &SnapshotDirty, hscan->rs_cbuf))
348 : {
349 0 : stat.tuple_len += tuple->t_len;
350 0 : stat.tuple_count++;
351 : }
352 : else
353 : {
354 0 : stat.dead_tuple_len += tuple->t_len;
355 0 : stat.dead_tuple_count++;
356 : }
357 :
358 0 : LockBuffer(hscan->rs_cbuf, BUFFER_LOCK_UNLOCK);
359 :
360 : /*
361 : * To avoid physically reading the table twice, try to do the
362 : * free-space scan in parallel with the heap scan. However,
363 : * heap_getnext may find no tuples on a given page, so we cannot
364 : * simply examine the pages returned by the heap scan.
365 : */
366 0 : tupblock = ItemPointerGetBlockNumber(&tuple->t_self);
367 :
368 0 : while (block <= tupblock)
369 : {
370 0 : CHECK_FOR_INTERRUPTS();
371 :
372 0 : buffer = ReadBufferExtended(rel, MAIN_FORKNUM, block,
373 : RBM_NORMAL, hscan->rs_strategy);
374 0 : LockBuffer(buffer, BUFFER_LOCK_SHARE);
375 0 : stat.free_space += PageGetHeapFreeSpace((Page) BufferGetPage(buffer));
376 0 : UnlockReleaseBuffer(buffer);
377 0 : block++;
378 : }
379 : }
380 :
381 16 : while (block < nblocks)
382 : {
383 0 : CHECK_FOR_INTERRUPTS();
384 :
385 0 : buffer = ReadBufferExtended(rel, MAIN_FORKNUM, block,
386 : RBM_NORMAL, hscan->rs_strategy);
387 0 : LockBuffer(buffer, BUFFER_LOCK_SHARE);
388 0 : stat.free_space += PageGetHeapFreeSpace((Page) BufferGetPage(buffer));
389 0 : UnlockReleaseBuffer(buffer);
390 0 : block++;
391 : }
392 :
393 16 : table_endscan(scan);
394 16 : relation_close(rel, AccessShareLock);
395 :
396 16 : stat.table_len = (uint64) nblocks * BLCKSZ;
397 :
398 16 : return build_pgstattuple_type(&stat, fcinfo);
399 : }
400 :
401 : /*
402 : * pgstat_btree_page -- check tuples in a btree page
403 : */
404 : static void
405 0 : pgstat_btree_page(pgstattuple_type *stat, Relation rel, BlockNumber blkno,
406 : BufferAccessStrategy bstrategy)
407 : {
408 : Buffer buf;
409 : Page page;
410 :
411 0 : buf = ReadBufferExtended(rel, MAIN_FORKNUM, blkno, RBM_NORMAL, bstrategy);
412 0 : LockBuffer(buf, BT_READ);
413 0 : page = BufferGetPage(buf);
414 :
415 : /* Page is valid, see what to do with it */
416 0 : if (PageIsNew(page))
417 : {
418 : /* fully empty page */
419 0 : stat->free_space += BLCKSZ;
420 : }
421 : else
422 : {
423 : BTPageOpaque opaque;
424 :
425 0 : opaque = BTPageGetOpaque(page);
426 0 : if (P_IGNORE(opaque))
427 : {
428 : /* deleted or half-dead page */
429 0 : stat->free_space += BLCKSZ;
430 : }
431 0 : else if (P_ISLEAF(opaque))
432 : {
433 0 : pgstat_index_page(stat, page, P_FIRSTDATAKEY(opaque),
434 0 : PageGetMaxOffsetNumber(page));
435 : }
436 : else
437 : {
438 : /* internal page */
439 : }
440 : }
441 :
442 0 : _bt_relbuf(rel, buf);
443 0 : }
444 :
445 : /*
446 : * pgstat_hash_page -- check tuples in a hash page
447 : */
448 : static void
449 0 : pgstat_hash_page(pgstattuple_type *stat, Relation rel, BlockNumber blkno,
450 : BufferAccessStrategy bstrategy)
451 : {
452 : Buffer buf;
453 : Page page;
454 :
455 0 : buf = _hash_getbuf_with_strategy(rel, blkno, HASH_READ, 0, bstrategy);
456 0 : page = BufferGetPage(buf);
457 :
458 0 : if (PageGetSpecialSize(page) == MAXALIGN(sizeof(HashPageOpaqueData)))
459 : {
460 : HashPageOpaque opaque;
461 :
462 0 : opaque = HashPageGetOpaque(page);
463 0 : switch (opaque->hasho_flag & LH_PAGE_TYPE)
464 : {
465 0 : case LH_UNUSED_PAGE:
466 0 : stat->free_space += BLCKSZ;
467 0 : break;
468 0 : case LH_BUCKET_PAGE:
469 : case LH_OVERFLOW_PAGE:
470 0 : pgstat_index_page(stat, page, FirstOffsetNumber,
471 0 : PageGetMaxOffsetNumber(page));
472 0 : break;
473 0 : case LH_BITMAP_PAGE:
474 : case LH_META_PAGE:
475 : default:
476 0 : break;
477 : }
478 : }
479 : else
480 : {
481 : /* maybe corrupted */
482 : }
483 :
484 0 : _hash_relbuf(rel, buf);
485 0 : }
486 :
487 : /*
488 : * pgstat_gist_page -- check tuples in a gist page
489 : */
490 : static void
491 0 : pgstat_gist_page(pgstattuple_type *stat, Relation rel, BlockNumber blkno,
492 : BufferAccessStrategy bstrategy)
493 : {
494 : Buffer buf;
495 : Page page;
496 :
497 0 : buf = ReadBufferExtended(rel, MAIN_FORKNUM, blkno, RBM_NORMAL, bstrategy);
498 0 : LockBuffer(buf, GIST_SHARE);
499 0 : gistcheckpage(rel, buf);
500 0 : page = BufferGetPage(buf);
501 :
502 0 : if (GistPageIsLeaf(page))
503 : {
504 0 : pgstat_index_page(stat, page, FirstOffsetNumber,
505 0 : PageGetMaxOffsetNumber(page));
506 : }
507 : else
508 : {
509 : /* root or node */
510 : }
511 :
512 0 : UnlockReleaseBuffer(buf);
513 0 : }
514 :
515 : /*
516 : * pgstat_index -- returns live/dead tuples info in a generic index
517 : */
518 : static Datum
519 0 : pgstat_index(Relation rel, BlockNumber start, pgstat_page pagefn,
520 : FunctionCallInfo fcinfo)
521 : {
522 : BlockNumber nblocks;
523 : BlockNumber blkno;
524 : BufferAccessStrategy bstrategy;
525 0 : pgstattuple_type stat = {0};
526 :
527 : /* prepare access strategy for this index */
528 0 : bstrategy = GetAccessStrategy(BAS_BULKREAD);
529 :
530 0 : blkno = start;
531 : for (;;)
532 : {
533 : /* Get the current relation length */
534 0 : LockRelationForExtension(rel, ExclusiveLock);
535 0 : nblocks = RelationGetNumberOfBlocks(rel);
536 0 : UnlockRelationForExtension(rel, ExclusiveLock);
537 :
538 : /* Quit if we've scanned the whole relation */
539 0 : if (blkno >= nblocks)
540 : {
541 0 : stat.table_len = (uint64) nblocks * BLCKSZ;
542 :
543 0 : break;
544 : }
545 :
546 0 : for (; blkno < nblocks; blkno++)
547 : {
548 0 : CHECK_FOR_INTERRUPTS();
549 :
550 0 : pagefn(&stat, rel, blkno, bstrategy);
551 : }
552 : }
553 :
554 0 : relation_close(rel, AccessShareLock);
555 :
556 0 : return build_pgstattuple_type(&stat, fcinfo);
557 : }
558 :
559 : /*
560 : * pgstat_index_page -- for generic index page
561 : */
562 : static void
563 0 : pgstat_index_page(pgstattuple_type *stat, Page page,
564 : OffsetNumber minoff, OffsetNumber maxoff)
565 : {
566 : OffsetNumber i;
567 :
568 0 : stat->free_space += PageGetFreeSpace(page);
569 :
570 0 : for (i = minoff; i <= maxoff; i = OffsetNumberNext(i))
571 : {
572 0 : ItemId itemid = PageGetItemId(page, i);
573 :
574 0 : if (ItemIdIsDead(itemid))
575 : {
576 0 : stat->dead_tuple_count++;
577 0 : stat->dead_tuple_len += ItemIdGetLength(itemid);
578 : }
579 : else
580 : {
581 0 : stat->tuple_count++;
582 0 : stat->tuple_len += ItemIdGetLength(itemid);
583 : }
584 : }
585 0 : }
|