Fail if recovery target is not reached

author Peter Eisentraut <peter@eisentraut.org>

Wed, 29 Jan 2020 14:43:32 +0000 (15:43 +0100)

committer Peter Eisentraut <peter@eisentraut.org>

Wed, 29 Jan 2020 14:58:14 +0000 (15:58 +0100)
author Peter Eisentraut <peter@eisentraut.org>
Wed, 29 Jan 2020 14:43:32 +0000 (15:43 +0100)
committer Peter Eisentraut <peter@eisentraut.org>
Wed, 29 Jan 2020 14:58:14 +0000 (15:58 +0100)
diff --git a/doc/src/sgml/config.sgml b/doc/src/sgml/config.sgml

index e07dc01e8024cb006b93a09d1f21b9f69cecd331..c1128f89ec7707f614a4e3d440a6eb5838774b18 100644 (file)
--- a/doc/src/sgml/config.sgml
+++ b/doc/src/sgml/config.sgml
@@ -3571,6 +3571,11 @@ restore_command = 'copy "C:\\server\\archivedir\\%f" "%p"'  # Windows
          If <xref linkend="guc-hot-standby"/> is not enabled, a setting of
          <literal>pause</literal> will act the same as <literal>shutdown</literal>.
         </para>
+       <para>
+        In any case, if a recovery target is configured but the archive
+        recovery ends before the target is reached, the server will shut down
+        with a fatal error.
+       </para>
        </listitem>
       </varlistentry>
  
diff --git a/src/backend/access/transam/xlog.c b/src/backend/access/transam/xlog.c

index 6e09ded5974fe26716ef4e32941f2ff407470510..3813eadfb49a19351e7836e424583e3a0bece571 100644 (file)
--- a/src/backend/access/transam/xlog.c
+++ b/src/backend/access/transam/xlog.c
@@ -6200,7 +6200,7 @@ StartupXLOG(void)
     XLogCtlInsert *Insert;
     CheckPoint  checkPoint;
     bool        wasShutdown;
-   bool        reachedStopPoint = false;
+   bool        reachedRecoveryTarget = false;
     bool        haveBackupLabel = false;
     bool        haveTblspcMap = false;
     XLogRecPtr  RecPtr,
@@ -7103,7 +7103,7 @@ StartupXLOG(void)
                  */
                 if (recoveryStopsBefore(xlogreader))
                 {
-                   reachedStopPoint = true;    /* see below */
+                   reachedRecoveryTarget = true;
                     break;
                 }
  
@@ -7258,7 +7258,7 @@ StartupXLOG(void)
                 /* Exit loop if we reached inclusive recovery target */
                 if (recoveryStopsAfter(xlogreader))
                 {
-                   reachedStopPoint = true;
+                   reachedRecoveryTarget = true;
                     break;
                 }
  
@@ -7270,7 +7270,7 @@ StartupXLOG(void)
              * end of main redo apply loop
              */
  
-           if (reachedStopPoint)
+           if (reachedRecoveryTarget)
             {
                 if (!reachedConsistency)
                     ereport(FATAL,
@@ -7327,7 +7327,18 @@ StartupXLOG(void)
             /* there are no WAL records following the checkpoint */
             ereport(LOG,
                     (errmsg("redo is not required")));
+
         }
+
+       /*
+        * This check is intentionally after the above log messages that
+        * indicate how far recovery went.
+        */
+       if (ArchiveRecoveryRequested &&
+           recoveryTarget != RECOVERY_TARGET_UNSET &&
+           !reachedRecoveryTarget)
+           ereport(FATAL,
+                   (errmsg("recovery ended before configured recovery target was reached")));
     }
  
     /*
diff --git a/src/test/perl/PostgresNode.pm b/src/test/perl/PostgresNode.pm

index 2e0cf4a2f3ebf4218d83c364a3ba5244229be250..bf095a7adb768195468eafd87f65e28f68bb524f 100644 (file)
--- a/src/test/perl/PostgresNode.pm
+++ b/src/test/perl/PostgresNode.pm
@@ -653,6 +653,9 @@ Restoring WAL segments from archives using restore_command can be enabled
  by passing the keyword parameter has_restoring => 1. This is disabled by
  default.
  
+If has_restoring is used, standby mode is used by default.  To use
+recovery mode instead, pass the keyword parameter standby => 0.
+
  The backup is copied, leaving the original unmodified. pg_hba.conf is
  unconditionally set to enable replication connections.
  
@@ -669,6 +672,7 @@ sub init_from_backup
  
     $params{has_streaming} = 0 unless defined $params{has_streaming};
     $params{has_restoring} = 0 unless defined $params{has_restoring};
+   $params{standby} = 1 unless defined $params{standby};
  
     print
       "# Initializing node \"$node_name\" from backup \"$backup_name\" of node \"$root_name\"\n";
@@ -699,7 +703,7 @@ port = $port
             "unix_socket_directories = '$host'");
     }
     $self->enable_streaming($root_node) if $params{has_streaming};
-   $self->enable_restoring($root_node) if $params{has_restoring};
+   $self->enable_restoring($root_node, $params{standby}) if $params{has_restoring};
     return;
  }
  
@@ -939,7 +943,7 @@ primary_conninfo='$root_connstr'
  # Internal routine to enable archive recovery command on a standby node
  sub enable_restoring
  {
-   my ($self, $root_node) = @_;
+   my ($self, $root_node, $standby) = @_;
     my $path = TestLib::perl2host($root_node->archive_dir);
     my $name = $self->name;
  
@@ -961,7 +965,30 @@ sub enable_restoring
         'postgresql.conf', qq(
  restore_command = '$copy_command'
  ));
-   $self->set_standby_mode();
+   if ($standby)
+   {
+       $self->set_standby_mode();
+   }
+   else
+   {
+       $self->set_recovery_mode();
+   }
+   return;
+}
+
+=pod
+
+=item $node->set_recovery_mode()
+
+Place recovery.signal file.
+
+=cut
+
+sub set_recovery_mode
+{
+   my ($self) = @_;
+
+   $self->append_conf('recovery.signal', '');
     return;
  }
  
diff --git a/src/test/recovery/t/003_recovery_targets.pl b/src/test/recovery/t/003_recovery_targets.pl

index d8fbd500112fb94631b5fb14427410fc8192d031..fd14bab208bd139b6a03ab84b57c4df9911b2de3 100644 (file)
--- a/src/test/recovery/t/003_recovery_targets.pl
+++ b/src/test/recovery/t/003_recovery_targets.pl
@@ -3,7 +3,8 @@ use strict;
  use warnings;
  use PostgresNode;
  use TestLib;
-use Test::More tests => 8;
+use Test::More tests => 9;
+use Time::HiRes qw(usleep);
  
  # Create and test a standby from given backup, with a certain recovery target.
  # Choose $until_lsn later than the transaction commit that causes the row
@@ -145,3 +146,24 @@ ok(!$res, 'invalid recovery startup fails');
  my $logfile = slurp_file($node_standby->logfile());
  ok($logfile =~ qr/multiple recovery targets specified/,
     'multiple conflicting settings');
+
+# Check behavior when recovery ends before target is reached
+
+$node_standby = get_new_node('standby_8');
+$node_standby->init_from_backup($node_master, 'my_backup',
+                               has_restoring => 1, standby => 0);
+$node_standby->append_conf('postgresql.conf',
+                          "recovery_target_name = 'does_not_exist'");
+
+run_log(['pg_ctl', '-D', $node_standby->data_dir,
+        '-l', $node_standby->logfile, 'start']);
+
+# wait up to 10 seconds for postgres to terminate
+foreach my $i (0..100)
+{
+   last if ! -f $node_standby->data_dir . '/postmaster.pid';
+   usleep(100_000);
+}
+$logfile = slurp_file($node_standby->logfile());
+ok($logfile =~ qr/FATAL:  recovery ended before configured recovery target was reached/,
+   'recovery end before target reached is a fatal error');
author	Peter Eisentraut <peter@eisentraut.org>
	Wed, 29 Jan 2020 14:43:32 +0000 (15:43 +0100)
committer	Peter Eisentraut <peter@eisentraut.org>
	Wed, 29 Jan 2020 14:58:14 +0000 (15:58 +0100)
doc/src/sgml/config.sgml		patch \| blob \| blame \| history
src/backend/access/transam/xlog.c		patch \| blob \| blame \| history
src/test/perl/PostgresNode.pm		patch \| blob \| blame \| history
src/test/recovery/t/003_recovery_targets.pl		patch \| blob \| blame \| history