Behave Tablespace Tests: fix cleanup race condition

Without synchronous_commit = 'remote_apply' introduced in 9.6, there is no guarantee that the mirrors have removed their tablespace directories by the time the DROP TABLESPACE command returns. We need those directories to no longer be in use by the mirrors before removing them. We are using the PL/PGSQL function checkpoint_and_wait_for_replication_replay() from src/test/walrep/sql/missing_xlog.sql to achieve the same semantics as 'remote_apply'. Co-authored-by: N Jacob Champion <pchampion@pivotal.io>

Behave Tablespace Tests: fix cleanup race condition
Without synchronous_commit = 'remote_apply' introduced in 9.6, there is no guarantee that the mirrors have removed their tablespace directories by the time the DROP TABLESPACE command returns. We need those directories to no longer be in use by the mirrors before removing them. We are using the PL/PGSQL function checkpoint_and_wait_for_replication_replay() from src/test/walrep/sql/missing_xlog.sql to achieve the same semantics as 'remote_apply'. Co-authored-by: N Jacob Champion <pchampion@pivotal.io>
a6bb6e3e · Kalen Krempely · Kalen Krempely · 971b2eb0 · a6bb6e3e
隐藏空白更改
内联并排

Showing with 79 addition and 1 deletion

gpMgmt/test/behave/mgmt_utils/steps/tablespace_mgmt_utils.py gpMgmt/test/behave/mgmt_utils/steps/tablespace_mgmt_utils.py +79 -1

未找到文件。
--- a/gpMgmt/test/behave/mgmt_utils/steps/tablespace_mgmt_utils.py
+++ b/gpMgmt/test/behave/mgmt_utils/steps/tablespace_mgmt_utils.py
@@ -28,11 +28,18 @@ class Tablespace:
            self.initial_data = db.query("SELECT gp_segment_id, i FROM tbl").getresult()

    def cleanup(self):
-        with dbconn.connect(dbconn.DbURL()) as conn:
+        with dbconn.connect(dbconn.DbURL(dbname="postgres")) as conn:
            db = pg.DB(conn)
            db.query("DROP DATABASE IF EXISTS %s" % self.dbname)
            db.query("DROP TABLESPACE IF EXISTS %s" % self.name)

+            # Without synchronous_commit = 'remote_apply' introduced in 9.6, there
+            # is no guarantee that the mirrors have removed their tablespace
+            # directories by the time the DROP TABLESPACE command returns.
+            # We need those directories to no longer be in use by the mirrors
+            # before removing them below.
+            _checkpoint_and_wait_for_replication_replay(db)
+
        shutil.rmtree(self.path)

    def verify(self):
@@ -55,6 +62,77 @@ class Tablespace:
                sorted(self.initial_data), sorted(data)))


+def _checkpoint_and_wait_for_replication_replay(db):
+    """
+    Taken from src/test/walrep/sql/missing_xlog.sql
+    """
+    db.query("""
+-- checkpoint to ensure clean xlog replication before bring down mirror
+create or replace function checkpoint_and_wait_for_replication_replay (retries int) returns bool as
+$$
+declare
+	i int;
+	checkpoint_locs pg_lsn[];
+	replay_locs pg_lsn[];
+	failed_for_segment text[];
+	r record;
+	all_caught_up bool;
+begin
+	i := 0;
+
+	-- Issue a checkpoint.
+	checkpoint;
+
+	-- Get the WAL positions after the checkpoint records on every segment.
+	for r in select gp_segment_id, pg_current_xlog_location() as loc from gp_dist_random('gp_id') loop
+		checkpoint_locs[r.gp_segment_id] = r.loc;
+	end loop;
+	-- and the QD, too.
+	checkpoint_locs[-1] = pg_current_xlog_location();
+
+	-- Force some WAL activity, to nudge the mirrors to replay past the
+	-- checkpoint location. There are some cases where a non-transactional
+	-- WAL record is created right after the checkpoint record, which
+	-- doesn't get replayed on the mirror until something else forces it
+	-- out.
+	drop table if exists dummy;
+	create temp table dummy (id int4) distributed randomly;
+
+	-- Wait until all mirrors have replayed up to the location we
+	-- memorized above.
+	loop
+		all_caught_up = true;
+		for r in select gp_segment_id, replay_location as loc from gp_stat_replication loop
+			replay_locs[r.gp_segment_id] = r.loc;
+			if r.loc < checkpoint_locs[r.gp_segment_id] then
+				all_caught_up = false;
+				failed_for_segment[r.gp_segment_id] = 1;
+			else
+				failed_for_segment[r.gp_segment_id] = 0;
+			end if;
+		end loop;
+
+		if all_caught_up then
+			return true;
+		end if;
+
+		if i >= retries then
+			RAISE INFO 'checkpoint_locs:    %', checkpoint_locs;
+			RAISE INFO 'replay_locs:        %', replay_locs;
+			RAISE INFO 'failed_for_segment: %', failed_for_segment;
+			return false;
+		end if;
+		perform pg_sleep(0.1);
+		i := i + 1;
+	end loop;
+end;
+$$ language plpgsql;
+
+SELECT checkpoint_and_wait_for_replication_replay(0);
+DROP FUNCTION checkpoint_and_wait_for_replication_replay(int);
+    """)
+
+
 @given('a tablespace is created with data')
 def impl(context):
    _create_tablespace_with_data(context, "outerspace")