mirror of
				https://github.com/postgres/postgres.git
				synced 2025-11-04 00:02:52 -05:00 
			
		
		
		
	The WAL receiver and WAL summarizer processes gain each one a call to pgstat_report_wal(), to make sure that they report their WAL statistics to pgstats, gathering data for pg_stat_io. In the WAL receiver, the stats reports are timed with status updates sent to the primary, that depend on wal_receiver_status_interval and wal_receiver_timeout. This is a conservative choice, but perhaps we could be more aggressive with the frequency of the stats reports. An interesting historical fact is that the WAL receiver does writes and syncs of WAL, but it has never reported its statistics to pgstats in pg_stat_wal. In the WAL summarizer, the stats reports are done each time the process waits for WAL. While on it, pg_stat_io is adjusted so as these two processes do not report any rows when IOObject is not WAL, making the view easier to use with less rows. Two tests are added in TAP, checking statistics for the WAL summarizer and the WAL receiver. Status updates in the WAL receiver are currently possible in the recovery test 001_stream_rep.pl. Reviewed-by: Bertrand Drouvot <bertranddrouvot.pg@gmail.com> Discussion: https://postgr.es/m/Z8UKZyVSHUUQJHNb@paquier.xyz
		
			
				
	
	
		
			105 lines
		
	
	
		
			3.4 KiB
		
	
	
	
		
			Perl
		
	
	
	
	
	
			
		
		
	
	
			105 lines
		
	
	
		
			3.4 KiB
		
	
	
	
		
			Perl
		
	
	
	
	
	
# Copyright (c) 2021-2025, PostgreSQL Global Development Group
 | 
						|
 | 
						|
use strict;
 | 
						|
use warnings FATAL => 'all';
 | 
						|
use File::Compare;
 | 
						|
use PostgreSQL::Test::Cluster;
 | 
						|
use PostgreSQL::Test::Utils;
 | 
						|
use Test::More;
 | 
						|
 | 
						|
# Set up a new database instance.
 | 
						|
my $node1 = PostgreSQL::Test::Cluster->new('node1');
 | 
						|
$node1->init(has_archiving => 1, allows_streaming => 1);
 | 
						|
$node1->append_conf('postgresql.conf', 'summarize_wal = on');
 | 
						|
$node1->start;
 | 
						|
 | 
						|
# Create a table and insert a few test rows into it. VACUUM FREEZE it so that
 | 
						|
# autovacuum doesn't induce any future modifications unexpectedly. Then
 | 
						|
# trigger a checkpoint.
 | 
						|
$node1->safe_psql('postgres', <<EOM);
 | 
						|
CREATE TABLE mytable (a int, b text);
 | 
						|
INSERT INTO mytable
 | 
						|
SELECT
 | 
						|
	g, random()::text||random()::text||random()::text||random()::text
 | 
						|
FROM
 | 
						|
	generate_series(1, 400) g;
 | 
						|
VACUUM FREEZE;
 | 
						|
EOM
 | 
						|
 | 
						|
# Record the current WAL insert LSN.
 | 
						|
my $base_lsn = $node1->safe_psql('postgres', <<EOM);
 | 
						|
SELECT pg_current_wal_insert_lsn()
 | 
						|
EOM
 | 
						|
note("just after insert, WAL insert LSN is $base_lsn");
 | 
						|
 | 
						|
# Now perform a CHECKPOINT.
 | 
						|
$node1->safe_psql('postgres', <<EOM);
 | 
						|
CHECKPOINT;
 | 
						|
EOM
 | 
						|
 | 
						|
# Wait for a new summary to show up, one that includes the inserts we just did.
 | 
						|
my $result = $node1->poll_query_until('postgres', <<EOM);
 | 
						|
SELECT EXISTS (
 | 
						|
    SELECT * from pg_available_wal_summaries()
 | 
						|
    WHERE end_lsn >= '$base_lsn'
 | 
						|
)
 | 
						|
EOM
 | 
						|
ok($result, "WAL summarization caught up after insert");
 | 
						|
 | 
						|
# The WAL summarizer should have generated some IO statistics.
 | 
						|
my $stats_reads = $node1->safe_psql(
 | 
						|
	'postgres',
 | 
						|
	qq{SELECT sum(reads) > 0 FROM pg_stat_io
 | 
						|
   WHERE backend_type = 'walsummarizer' AND object = 'wal'});
 | 
						|
is($stats_reads, 't', "WAL summarizer generates statistics for WAL reads");
 | 
						|
 | 
						|
# Find the highest LSN that is summarized on disk.
 | 
						|
my $summarized_lsn = $node1->safe_psql('postgres', <<EOM);
 | 
						|
SELECT MAX(end_lsn) AS summarized_lsn FROM pg_available_wal_summaries()
 | 
						|
EOM
 | 
						|
note("after insert, summarized through $summarized_lsn");
 | 
						|
 | 
						|
# Update a row in the first block of the table and trigger a checkpoint.
 | 
						|
$node1->safe_psql('postgres', <<EOM);
 | 
						|
UPDATE mytable SET b = 'abcdefghijklmnopqrstuvwxyz' || b || '01234567890'
 | 
						|
	WHERE a = 2;
 | 
						|
CHECKPOINT;
 | 
						|
EOM
 | 
						|
 | 
						|
# Wait for a new summary to show up.
 | 
						|
$result = $node1->poll_query_until('postgres', <<EOM);
 | 
						|
SELECT EXISTS (
 | 
						|
    SELECT * from pg_available_wal_summaries()
 | 
						|
    WHERE end_lsn > '$summarized_lsn'
 | 
						|
)
 | 
						|
EOM
 | 
						|
ok($result, "got new WAL summary after update");
 | 
						|
 | 
						|
# Figure out the exact details for the new summary file.
 | 
						|
my $details = $node1->safe_psql('postgres', <<EOM);
 | 
						|
SELECT tli, start_lsn, end_lsn from pg_available_wal_summaries()
 | 
						|
	WHERE end_lsn > '$summarized_lsn'
 | 
						|
EOM
 | 
						|
my @lines = split(/\n/, $details);
 | 
						|
is(0 + @lines, 1, "got exactly one new WAL summary");
 | 
						|
my ($tli, $start_lsn, $end_lsn) = split(/\|/, $lines[0]);
 | 
						|
note("examining summary for TLI $tli from $start_lsn to $end_lsn");
 | 
						|
 | 
						|
# Reconstruct the full pathname for the WAL summary file.
 | 
						|
my $filename = sprintf "%s/pg_wal/summaries/%08s%08s%08s%08s%08s.summary",
 | 
						|
  $node1->data_dir, $tli,
 | 
						|
  split(m@/@, $start_lsn),
 | 
						|
  split(m@/@, $end_lsn);
 | 
						|
ok(-f $filename, "WAL summary file exists");
 | 
						|
 | 
						|
# Run pg_walsummary on it. We expect exactly two blocks to be modified,
 | 
						|
# block 0 and one other.
 | 
						|
my ($stdout, $stderr) = run_command([ 'pg_walsummary', '-i', $filename ]);
 | 
						|
note($stdout);
 | 
						|
@lines = split(/\n/, $stdout);
 | 
						|
like($stdout, qr/FORK main: block 0$/m, "stdout shows block 0 modified");
 | 
						|
is($stderr, '', 'stderr is empty');
 | 
						|
is(0 + @lines, 2, "UPDATE modified 2 blocks");
 | 
						|
 | 
						|
done_testing();
 |