2007-05-18 03:11:25 +08:00
|
|
|
/*-------------------------------------------------------------------------
|
|
|
|
*
|
|
|
|
* rawpage.c
|
|
|
|
* Functions to extract a raw page as bytea and inspect it
|
|
|
|
*
|
|
|
|
* Access-method specific inspection functions are in separate files.
|
|
|
|
*
|
2021-01-03 02:06:25 +08:00
|
|
|
* Copyright (c) 2007-2021, PostgreSQL Global Development Group
|
2007-05-18 03:11:25 +08:00
|
|
|
*
|
|
|
|
* IDENTIFICATION
|
2010-09-21 04:08:53 +08:00
|
|
|
* contrib/pageinspect/rawpage.c
|
2007-05-18 03:11:25 +08:00
|
|
|
*
|
|
|
|
*-------------------------------------------------------------------------
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "postgres.h"
|
|
|
|
|
2012-08-31 04:15:44 +08:00
|
|
|
#include "access/htup_details.h"
|
2019-01-22 02:18:20 +08:00
|
|
|
#include "access/relation.h"
|
2007-05-18 03:11:25 +08:00
|
|
|
#include "catalog/namespace.h"
|
2014-03-03 20:14:31 +08:00
|
|
|
#include "catalog/pg_type.h"
|
2008-05-12 08:00:54 +08:00
|
|
|
#include "funcapi.h"
|
2007-05-18 03:11:25 +08:00
|
|
|
#include "miscadmin.h"
|
2019-10-23 11:56:22 +08:00
|
|
|
#include "pageinspect.h"
|
2008-05-12 08:00:54 +08:00
|
|
|
#include "storage/bufmgr.h"
|
2017-03-17 21:49:10 +08:00
|
|
|
#include "storage/checksum.h"
|
2008-05-12 08:00:54 +08:00
|
|
|
#include "utils/builtins.h"
|
2014-03-03 20:14:31 +08:00
|
|
|
#include "utils/pg_lsn.h"
|
2011-02-24 01:18:09 +08:00
|
|
|
#include "utils/rel.h"
|
2017-01-21 09:29:53 +08:00
|
|
|
#include "utils/varlena.h"
|
2007-05-18 03:11:25 +08:00
|
|
|
|
|
|
|
PG_MODULE_MAGIC;
|
|
|
|
|
2009-06-09 00:22:44 +08:00
|
|
|
static bytea *get_raw_page_internal(text *relname, ForkNumber forknum,
|
2019-05-23 01:04:48 +08:00
|
|
|
BlockNumber blkno);
|
2009-06-09 00:22:44 +08:00
|
|
|
|
|
|
|
|
2007-05-18 03:11:25 +08:00
|
|
|
/*
|
|
|
|
* get_raw_page
|
|
|
|
*
|
|
|
|
* Returns a copy of a page from shared buffers as a bytea
|
|
|
|
*/
|
|
|
|
PG_FUNCTION_INFO_V1(get_raw_page);
|
|
|
|
|
|
|
|
Datum
|
|
|
|
get_raw_page(PG_FUNCTION_ARGS)
|
2009-06-09 00:22:44 +08:00
|
|
|
{
|
2017-03-13 07:35:34 +08:00
|
|
|
text *relname = PG_GETARG_TEXT_PP(0);
|
2009-06-09 00:22:44 +08:00
|
|
|
uint32 blkno = PG_GETARG_UINT32(1);
|
|
|
|
bytea *raw_page;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* We don't normally bother to check the number of arguments to a C
|
|
|
|
* function, but here it's needed for safety because early 8.4 beta
|
|
|
|
* releases mistakenly redefined get_raw_page() as taking three arguments.
|
|
|
|
*/
|
|
|
|
if (PG_NARGS() != 2)
|
|
|
|
ereport(ERROR,
|
|
|
|
(errmsg("wrong number of arguments to get_raw_page()"),
|
|
|
|
errhint("Run the updated pageinspect.sql script.")));
|
|
|
|
|
|
|
|
raw_page = get_raw_page_internal(relname, MAIN_FORKNUM, blkno);
|
|
|
|
|
|
|
|
PG_RETURN_BYTEA_P(raw_page);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* get_raw_page_fork
|
|
|
|
*
|
|
|
|
* Same, for any fork
|
|
|
|
*/
|
|
|
|
PG_FUNCTION_INFO_V1(get_raw_page_fork);
|
|
|
|
|
|
|
|
Datum
|
|
|
|
get_raw_page_fork(PG_FUNCTION_ARGS)
|
2007-05-18 03:11:25 +08:00
|
|
|
{
|
2017-03-13 07:35:34 +08:00
|
|
|
text *relname = PG_GETARG_TEXT_PP(0);
|
|
|
|
text *forkname = PG_GETARG_TEXT_PP(1);
|
2008-09-30 18:52:14 +08:00
|
|
|
uint32 blkno = PG_GETARG_UINT32(2);
|
2009-06-09 00:22:44 +08:00
|
|
|
bytea *raw_page;
|
2008-10-06 22:13:17 +08:00
|
|
|
ForkNumber forknum;
|
2007-05-18 03:11:25 +08:00
|
|
|
|
2009-06-09 00:22:44 +08:00
|
|
|
forknum = forkname_to_number(text_to_cstring(forkname));
|
|
|
|
|
|
|
|
raw_page = get_raw_page_internal(relname, forknum, blkno);
|
|
|
|
|
|
|
|
PG_RETURN_BYTEA_P(raw_page);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* workhorse
|
|
|
|
*/
|
|
|
|
static bytea *
|
|
|
|
get_raw_page_internal(text *relname, ForkNumber forknum, BlockNumber blkno)
|
|
|
|
{
|
2007-11-16 05:14:46 +08:00
|
|
|
bytea *raw_page;
|
2009-06-09 00:22:44 +08:00
|
|
|
RangeVar *relrv;
|
|
|
|
Relation rel;
|
2007-11-16 05:14:46 +08:00
|
|
|
char *raw_page_data;
|
2007-05-18 03:11:25 +08:00
|
|
|
Buffer buf;
|
|
|
|
|
|
|
|
if (!superuser())
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_INSUFFICIENT_PRIVILEGE),
|
2020-01-31 00:32:04 +08:00
|
|
|
errmsg("must be superuser to use raw page functions")));
|
2007-05-18 03:11:25 +08:00
|
|
|
|
|
|
|
relrv = makeRangeVarFromNameList(textToQualifiedNameList(relname));
|
|
|
|
rel = relation_openrv(relrv, AccessShareLock);
|
|
|
|
|
|
|
|
/* Check that this relation has storage */
|
|
|
|
if (rel->rd_rel->relkind == RELKIND_VIEW)
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_WRONG_OBJECT_TYPE),
|
|
|
|
errmsg("cannot get raw page from view \"%s\"",
|
2007-11-16 05:14:46 +08:00
|
|
|
RelationGetRelationName(rel))));
|
2007-05-18 03:11:25 +08:00
|
|
|
if (rel->rd_rel->relkind == RELKIND_COMPOSITE_TYPE)
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_WRONG_OBJECT_TYPE),
|
|
|
|
errmsg("cannot get raw page from composite type \"%s\"",
|
2007-11-16 05:14:46 +08:00
|
|
|
RelationGetRelationName(rel))));
|
2011-01-02 12:48:11 +08:00
|
|
|
if (rel->rd_rel->relkind == RELKIND_FOREIGN_TABLE)
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_WRONG_OBJECT_TYPE),
|
|
|
|
errmsg("cannot get raw page from foreign table \"%s\"",
|
2017-03-10 05:34:25 +08:00
|
|
|
RelationGetRelationName(rel))));
|
|
|
|
if (rel->rd_rel->relkind == RELKIND_PARTITIONED_TABLE)
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_WRONG_OBJECT_TYPE),
|
|
|
|
errmsg("cannot get raw page from partitioned table \"%s\"",
|
2011-01-02 12:48:11 +08:00
|
|
|
RelationGetRelationName(rel))));
|
2018-05-10 01:03:43 +08:00
|
|
|
if (rel->rd_rel->relkind == RELKIND_PARTITIONED_INDEX)
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_WRONG_OBJECT_TYPE),
|
|
|
|
errmsg("cannot get raw page from partitioned index \"%s\"",
|
|
|
|
RelationGetRelationName(rel))));
|
2007-05-18 03:11:25 +08:00
|
|
|
|
2009-04-01 06:54:31 +08:00
|
|
|
/*
|
2009-06-11 22:49:15 +08:00
|
|
|
* Reject attempts to read non-local temporary relations; we would be
|
|
|
|
* likely to get wrong data since we have no visibility into the owning
|
|
|
|
* session's local buffers.
|
2009-04-01 06:54:31 +08:00
|
|
|
*/
|
|
|
|
if (RELATION_IS_OTHER_TEMP(rel))
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
|
|
|
|
errmsg("cannot access temporary tables of other sessions")));
|
|
|
|
|
2014-07-22 23:45:46 +08:00
|
|
|
if (blkno >= RelationGetNumberOfBlocksInFork(rel, forknum))
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
|
|
|
|
errmsg("block number %u is out of range for relation \"%s\"",
|
|
|
|
blkno, RelationGetRelationName(rel))));
|
2007-05-18 03:11:25 +08:00
|
|
|
|
|
|
|
/* Initialize buffer to copy to */
|
|
|
|
raw_page = (bytea *) palloc(BLCKSZ + VARHDRSZ);
|
|
|
|
SET_VARSIZE(raw_page, BLCKSZ + VARHDRSZ);
|
|
|
|
raw_page_data = VARDATA(raw_page);
|
|
|
|
|
|
|
|
/* Take a verbatim copy of the page */
|
|
|
|
|
Unite ReadBufferWithFork, ReadBufferWithStrategy, and ZeroOrReadBuffer
functions into one ReadBufferExtended function, that takes the strategy
and mode as argument. There's three modes, RBM_NORMAL which is the default
used by plain ReadBuffer(), RBM_ZERO, which replaces ZeroOrReadBuffer, and
a new mode RBM_ZERO_ON_ERROR, which allows callers to read corrupt pages
without throwing an error. The FSM needs the new mode to recover from
corrupt pages, which could happend if we crash after extending an FSM file,
and the new page is "torn".
Add fork number to some error messages in bufmgr.c, that still lacked it.
2008-10-31 23:05:00 +08:00
|
|
|
buf = ReadBufferExtended(rel, forknum, blkno, RBM_NORMAL, NULL);
|
2007-05-18 03:11:25 +08:00
|
|
|
LockBuffer(buf, BUFFER_LOCK_SHARE);
|
|
|
|
|
2016-04-20 21:31:19 +08:00
|
|
|
memcpy(raw_page_data, BufferGetPage(buf), BLCKSZ);
|
2007-05-18 03:11:25 +08:00
|
|
|
|
|
|
|
LockBuffer(buf, BUFFER_LOCK_UNLOCK);
|
|
|
|
ReleaseBuffer(buf);
|
|
|
|
|
|
|
|
relation_close(rel, AccessShareLock);
|
|
|
|
|
2009-06-09 00:22:44 +08:00
|
|
|
return raw_page;
|
2007-05-18 03:11:25 +08:00
|
|
|
}
|
|
|
|
|
2017-02-04 00:34:41 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* get_page_from_raw
|
|
|
|
*
|
|
|
|
* Get a palloc'd, maxalign'ed page image from the result of get_raw_page()
|
|
|
|
*
|
|
|
|
* On machines with MAXALIGN = 8, the payload of a bytea is not maxaligned,
|
|
|
|
* since it will start 4 bytes into a palloc'd value. On alignment-picky
|
|
|
|
* machines, this will cause failures in accesses to 8-byte-wide values
|
|
|
|
* within the page. We don't need to worry if accessing only 4-byte or
|
|
|
|
* smaller fields, but when examining a struct that contains 8-byte fields,
|
|
|
|
* use this function for safety.
|
|
|
|
*/
|
|
|
|
Page
|
|
|
|
get_page_from_raw(bytea *raw_page)
|
|
|
|
{
|
|
|
|
Page page;
|
|
|
|
int raw_page_size;
|
|
|
|
|
2017-03-13 07:35:34 +08:00
|
|
|
raw_page_size = VARSIZE_ANY_EXHDR(raw_page);
|
2017-02-04 00:34:41 +08:00
|
|
|
|
|
|
|
if (raw_page_size != BLCKSZ)
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
|
|
|
|
errmsg("invalid page size"),
|
|
|
|
errdetail("Expected %d bytes, got %d.",
|
|
|
|
BLCKSZ, raw_page_size)));
|
|
|
|
|
|
|
|
page = palloc(raw_page_size);
|
|
|
|
|
2017-03-13 07:35:34 +08:00
|
|
|
memcpy(page, VARDATA_ANY(raw_page), raw_page_size);
|
2017-02-04 00:34:41 +08:00
|
|
|
|
|
|
|
return page;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2007-05-18 03:11:25 +08:00
|
|
|
/*
|
|
|
|
* page_header
|
|
|
|
*
|
|
|
|
* Allows inspection of page header fields of a raw page
|
|
|
|
*/
|
|
|
|
|
|
|
|
PG_FUNCTION_INFO_V1(page_header);
|
|
|
|
|
|
|
|
Datum
|
|
|
|
page_header(PG_FUNCTION_ARGS)
|
|
|
|
{
|
|
|
|
bytea *raw_page = PG_GETARG_BYTEA_P(0);
|
|
|
|
int raw_page_size;
|
|
|
|
|
|
|
|
TupleDesc tupdesc;
|
|
|
|
|
|
|
|
Datum result;
|
|
|
|
HeapTuple tuple;
|
2007-09-22 05:25:42 +08:00
|
|
|
Datum values[9];
|
|
|
|
bool nulls[9];
|
2007-05-18 03:11:25 +08:00
|
|
|
|
|
|
|
PageHeader page;
|
|
|
|
XLogRecPtr lsn;
|
|
|
|
|
|
|
|
if (!superuser())
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_INSUFFICIENT_PRIVILEGE),
|
2020-01-31 00:32:04 +08:00
|
|
|
errmsg("must be superuser to use raw page functions")));
|
2007-05-18 03:11:25 +08:00
|
|
|
|
|
|
|
raw_page_size = VARSIZE(raw_page) - VARHDRSZ;
|
|
|
|
|
|
|
|
/*
|
2007-11-16 05:14:46 +08:00
|
|
|
* Check that enough data was supplied, so that we don't try to access
|
|
|
|
* fields outside the supplied buffer.
|
2007-05-18 03:11:25 +08:00
|
|
|
*/
|
2015-02-20 13:11:42 +08:00
|
|
|
if (raw_page_size < SizeOfPageHeaderData)
|
2007-11-16 05:14:46 +08:00
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
|
|
|
|
errmsg("input page too small (%d bytes)", raw_page_size)));
|
2007-05-18 03:11:25 +08:00
|
|
|
|
|
|
|
page = (PageHeader) VARDATA(raw_page);
|
|
|
|
|
|
|
|
/* Build a tuple descriptor for our result type */
|
|
|
|
if (get_call_result_type(fcinfo, NULL, &tupdesc) != TYPEFUNC_COMPOSITE)
|
|
|
|
elog(ERROR, "return type must be a row type");
|
|
|
|
|
|
|
|
/* Extract information from the page header */
|
|
|
|
|
|
|
|
lsn = PageGetLSN(page);
|
|
|
|
|
2014-03-03 20:14:31 +08:00
|
|
|
/* pageinspect >= 1.2 uses pg_lsn instead of text for the LSN field. */
|
2017-08-21 02:19:07 +08:00
|
|
|
if (TupleDescAttr(tupdesc, 0)->atttypid == TEXTOID)
|
2014-03-03 20:14:31 +08:00
|
|
|
{
|
2014-05-07 00:12:18 +08:00
|
|
|
char lsnchar[64];
|
|
|
|
|
2014-03-03 20:14:31 +08:00
|
|
|
snprintf(lsnchar, sizeof(lsnchar), "%X/%X",
|
|
|
|
(uint32) (lsn >> 32), (uint32) lsn);
|
|
|
|
values[0] = CStringGetTextDatum(lsnchar);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
values[0] = LSNGetDatum(lsn);
|
2013-03-18 21:46:42 +08:00
|
|
|
values[1] = UInt16GetDatum(page->pd_checksum);
|
2007-05-18 03:11:25 +08:00
|
|
|
values[2] = UInt16GetDatum(page->pd_flags);
|
|
|
|
values[3] = UInt16GetDatum(page->pd_lower);
|
|
|
|
values[4] = UInt16GetDatum(page->pd_upper);
|
|
|
|
values[5] = UInt16GetDatum(page->pd_special);
|
|
|
|
values[6] = UInt16GetDatum(PageGetPageSize(page));
|
|
|
|
values[7] = UInt16GetDatum(PageGetPageLayoutVersion(page));
|
2007-09-22 05:25:42 +08:00
|
|
|
values[8] = TransactionIdGetDatum(page->pd_prune_xid);
|
2007-05-18 03:11:25 +08:00
|
|
|
|
2007-11-16 05:14:46 +08:00
|
|
|
/* Build and return the tuple. */
|
2007-05-18 03:11:25 +08:00
|
|
|
|
|
|
|
memset(nulls, 0, sizeof(nulls));
|
|
|
|
|
2007-11-16 05:14:46 +08:00
|
|
|
tuple = heap_form_tuple(tupdesc, values, nulls);
|
|
|
|
result = HeapTupleGetDatum(tuple);
|
2007-05-18 03:11:25 +08:00
|
|
|
|
|
|
|
PG_RETURN_DATUM(result);
|
|
|
|
}
|
2017-03-17 21:49:10 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* page_checksum
|
|
|
|
*
|
|
|
|
* Compute checksum of a raw page
|
|
|
|
*/
|
|
|
|
|
|
|
|
PG_FUNCTION_INFO_V1(page_checksum);
|
|
|
|
|
|
|
|
Datum
|
|
|
|
page_checksum(PG_FUNCTION_ARGS)
|
|
|
|
{
|
|
|
|
bytea *raw_page = PG_GETARG_BYTEA_P(0);
|
|
|
|
uint32 blkno = PG_GETARG_INT32(1);
|
|
|
|
int raw_page_size;
|
|
|
|
PageHeader page;
|
|
|
|
|
|
|
|
if (!superuser())
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_INSUFFICIENT_PRIVILEGE),
|
2020-01-31 00:32:04 +08:00
|
|
|
errmsg("must be superuser to use raw page functions")));
|
2017-03-17 21:49:10 +08:00
|
|
|
|
|
|
|
raw_page_size = VARSIZE(raw_page) - VARHDRSZ;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Check that the supplied page is of the right size.
|
|
|
|
*/
|
|
|
|
if (raw_page_size != BLCKSZ)
|
|
|
|
ereport(ERROR,
|
|
|
|
(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
|
Phase 3 of pgindent updates.
Don't move parenthesized lines to the left, even if that means they
flow past the right margin.
By default, BSD indent lines up statement continuation lines that are
within parentheses so that they start just to the right of the preceding
left parenthesis. However, traditionally, if that resulted in the
continuation line extending to the right of the desired right margin,
then indent would push it left just far enough to not overrun the margin,
if it could do so without making the continuation line start to the left of
the current statement indent. That makes for a weird mix of indentations
unless one has been completely rigid about never violating the 80-column
limit.
This behavior has been pretty universally panned by Postgres developers.
Hence, disable it with indent's new -lpl switch, so that parenthesized
lines are always lined up with the preceding left paren.
This patch is much less interesting than the first round of indent
changes, but also bulkier, so I thought it best to separate the effects.
Discussion: https://postgr.es/m/E1dAmxK-0006EE-1r@gemulon.postgresql.org
Discussion: https://postgr.es/m/30527.1495162840@sss.pgh.pa.us
2017-06-22 03:35:54 +08:00
|
|
|
errmsg("incorrect size of input page (%d bytes)", raw_page_size)));
|
2017-03-17 21:49:10 +08:00
|
|
|
|
|
|
|
page = (PageHeader) VARDATA(raw_page);
|
|
|
|
|
2017-05-18 04:31:56 +08:00
|
|
|
PG_RETURN_INT16(pg_checksum_page((char *) page, blkno));
|
2017-03-17 21:49:10 +08:00
|
|
|
}
|