diff --git a/src/yb/integration-tests/cdcsdk_ysql-test.cc b/src/yb/integration-tests/cdcsdk_ysql-test.cc index 78d4939ea5c2..63814fe54ea8 100644 --- a/src/yb/integration-tests/cdcsdk_ysql-test.cc +++ b/src/yb/integration-tests/cdcsdk_ysql-test.cc @@ -7855,5 +7855,361 @@ TEST_F(CDCSDKYsqlTest, TestNonUserTableShouldNotGetAddedToConsistentSnapshotCDCS TestNonUserTableShouldNotGetAddedToCDCStream(/* create_consistent_snapshot_stream */ true); } +void CDCSDKYsqlTest::TestDisableOfDynamicTableAdditionOnCDCStream( + bool use_consistent_snapshot_stream) { + ANNOTATE_UNPROTECTED_WRITE(FLAGS_yb_enable_cdc_consistent_snapshot_streams) = + use_consistent_snapshot_stream; + ANNOTATE_UNPROTECTED_WRITE(FLAGS_catalog_manager_bg_task_wait_ms) = 100; + ANNOTATE_UNPROTECTED_WRITE(FLAGS_cdcsdk_enable_dynamic_tables_disable_option) = true; + // Setup cluster. + ASSERT_OK(SetUpWithParams(3, 3, false)); + + const vector table_list_suffix = {"_0", "_1", "_2", "_3", "_4"}; + const int kNumTables = 5; + vector table(kNumTables); + int idx = 0; + vector> tablets(kNumTables); + + // Create and populate data in the first two tables. + for (idx = 0; idx < 2; idx++) { + table[idx] = ASSERT_RESULT(CreateTable( + &test_cluster_, kNamespaceName, kTableName, 1, true, false, 0, true, + table_list_suffix[idx])); + ASSERT_OK(test_client()->GetTablets( + table[idx], 0, &tablets[idx], /* partition_list_version = */ nullptr)); + ASSERT_OK(WriteEnumsRows( + 0 /* start */, 100 /* end */, &test_cluster_, table_list_suffix[idx], kNamespaceName, + kTableName)); + } + + auto stream_id1 = use_consistent_snapshot_stream ? ASSERT_RESULT(CreateConsistentSnapshotStream()) + : ASSERT_RESULT(CreateDBStream(EXPLICIT)); + auto stream_id2 = use_consistent_snapshot_stream ? 
ASSERT_RESULT(CreateConsistentSnapshotStream()) + : ASSERT_RESULT(CreateDBStream(EXPLICIT)); + + std::unordered_set expected_table_ids = {table[0].table_id(), table[1].table_id()}; + VerifyTablesInStreamMetadata( + stream_id1, expected_table_ids, "Waiting for stream metadata after stream creation."); + VerifyTablesInStreamMetadata( + stream_id2, expected_table_ids, "Waiting for stream metadata after stream creation."); + + // Since dynamic table addition is not yet disabled, create a new table and verify that it gets + // added to stream metadata of both the streams. + table[idx] = ASSERT_RESULT(CreateTable( + &test_cluster_, kNamespaceName, kTableName, 1, true, false, 0, true, table_list_suffix[idx])); + ASSERT_OK(test_client()->GetTablets( + table[idx], 0, &tablets[idx], /* partition_list_version = */ nullptr)); + idx += 1; + + expected_table_ids.insert(table[idx - 1].table_id()); + VerifyTablesInStreamMetadata( + stream_id1, expected_table_ids, "Waiting for GetDBStreamInfo after creating a new table."); + VerifyTablesInStreamMetadata( + stream_id2, expected_table_ids, "Waiting for GetDBStreamInfo after creating a new table."); + + // Disable dynamic table addition on stream1 via the yb-admin command. + ASSERT_OK(DisableDynamicTableAdditionOnCDCSDKStream(stream_id1)); + + // Create a new table and verify that it only gets added to stream2's metadata. + table[idx] = ASSERT_RESULT(CreateTable( + &test_cluster_, kNamespaceName, kTableName, 1, true, false, 0, true, table_list_suffix[idx])); + ASSERT_OK(test_client()->GetTablets( + table[idx], 0, &tablets[idx], /* partition_list_version = */ nullptr)); + idx += 1; + + // wait for the bg thread responsible for dynamic table addition to complete its processing. + SleepFor(MonoDelta::FromSeconds(2 * kTimeMultiplier)); + + // Stream1's metadata should not contain table_4 as dynamic table addition is disabled. Therefore, + // the expected set of tables remains same as before. 
+ VerifyTablesInStreamMetadata( + stream_id1, expected_table_ids, + "Waiting for GetDBStreamInfo after disabling dynamic table addition on stream1."); + + // Stream2's metadata should contain table_4 as dynamic table addition is not disabled. + auto expected_table_ids_for_stream2 = expected_table_ids; + expected_table_ids_for_stream2.insert(table[idx - 1].table_id()); + VerifyTablesInStreamMetadata( + stream_id2, expected_table_ids_for_stream2, + "Waiting for GetDBStreamInfo after disabling dynamic table addition on stream1."); + + // Verify tablets of table_4 have only been added to cdc_state table for stream2. + std::unordered_set expected_tablets_for_stream1; + std::unordered_set expected_tablets_for_stream2; + for (int i = 0; i < idx; i++) { + if (i < 3) { + expected_tablets_for_stream1.insert(tablets[i].Get(0).tablet_id()); + } + expected_tablets_for_stream2.insert(tablets[i].Get(0).tablet_id()); + } + + CheckTabletsInCDCStateTable(expected_tablets_for_stream1, test_client(), stream_id1); + CheckTabletsInCDCStateTable(expected_tablets_for_stream2, test_client(), stream_id2); + + // Even on a master restart, table_4 should not get added to the stream1. + auto leader_master = ASSERT_RESULT(test_cluster_.mini_cluster_->GetLeaderMiniMaster()); + ASSERT_OK(leader_master->Restart()); + LOG(INFO) << "Master Restarted"; + SleepFor(MonoDelta::FromSeconds(5 * kTimeMultiplier)); + + // Any newly created table after master restart should not get added to stream1. + table[idx] = ASSERT_RESULT(CreateTable( + &test_cluster_, kNamespaceName, kTableName, 1, true, false, 0, true, table_list_suffix[idx])); + ASSERT_OK(test_client()->GetTablets( + table[idx], 0, &tablets[idx], /* partition_list_version = */ nullptr)); + idx += 1; + + // wait for the bg thread responsible for dynamic table addition to complete its processing. + SleepFor(MonoDelta::FromSeconds(2 * kTimeMultiplier)); + + // Stream1's metadata should not contain table_5 as dynamic table addition is disabled. 
+ VerifyTablesInStreamMetadata( + stream_id1, expected_table_ids, + "Waiting for GetDBStreamInfo after creating new table on master restart."); + + // Stream2's metadata should contain table_5 as dynamic table addition is not disabled. + expected_table_ids_for_stream2.insert(table[idx - 1].table_id()); + VerifyTablesInStreamMetadata( + stream_id2, expected_table_ids_for_stream2, + "Waiting for GetDBStreamInfo after creating new table on master restart."); + + // verify tablets of table_4 & table_5 have not been added to cdc_state table for stream1. + CheckTabletsInCDCStateTable(expected_tablets_for_stream1, test_client(), stream_id1); + + // Tablets of table_5 should be added to cdc state table for stream2. + expected_tablets_for_stream2.insert(tablets[idx - 1].Get(0).tablet_id()); + CheckTabletsInCDCStateTable(expected_tablets_for_stream2, test_client(), stream_id2); +} + +TEST_F(CDCSDKYsqlTest, TestDisableOfDynamicTableAdditionOnNonConsistentSnapshotStream) { + TestDisableOfDynamicTableAdditionOnCDCStream( + /* use_consistent_snapshot_stream */ false); +} + +TEST_F(CDCSDKYsqlTest, TestDisableOfDynamicTableAdditionOnConsistentSnapshotStream) { + TestDisableOfDynamicTableAdditionOnCDCStream( + /* use_consistent_snapshot_stream */ true); +} + +void CDCSDKYsqlTest::TestUserTableRemovalFromCDCStream(bool use_consistent_snapshot_stream) { + ANNOTATE_UNPROTECTED_WRITE(FLAGS_yb_enable_cdc_consistent_snapshot_streams) = + use_consistent_snapshot_stream; + ANNOTATE_UNPROTECTED_WRITE(FLAGS_update_min_cdc_indices_interval_secs) = 1; + ANNOTATE_UNPROTECTED_WRITE(FLAGS_cdcsdk_enable_dynamic_tables_disable_option) = true; + // Setup cluster. + ASSERT_OK(SetUpWithParams(1, 1, false)); + + const vector table_list_suffix = {"_0", "_1", "_2"}; + const int kNumTables = 3; + vector table(kNumTables); + int idx = 0; + vector> tablets(kNumTables); + + // Create and populate data in the all 3 tables. 
+ for (idx = 0; idx < kNumTables; idx++) { + table[idx] = ASSERT_RESULT(CreateTable( + &test_cluster_, kNamespaceName, kTableName, 1, true, false, 0, true, + table_list_suffix[idx])); + ASSERT_OK(test_client()->GetTablets( + table[idx], 0, &tablets[idx], /* partition_list_version = */ nullptr)); + ASSERT_OK(WriteEnumsRows( + 0 /* start */, 100 /* end */, &test_cluster_, table_list_suffix[idx], kNamespaceName, + kTableName)); + } + + auto stream_id = use_consistent_snapshot_stream + ? ASSERT_RESULT(CreateConsistentSnapshotStream()) + : ASSERT_RESULT(CreateDBStream(CDCCheckpointType::EXPLICIT)); + + // Before we remove a table, get the initial stream metadata as well as cdc state table entries. + std::unordered_set expected_tables; + for (const auto& table_entry : table) { + expected_tables.insert(table_entry.table_id()); + } + + VerifyTablesInStreamMetadata( + stream_id, expected_tables, "Waiting for GetDBStreamInfo after stream creation"); + + std::unordered_set expected_tablets; + for (const auto& tablets_entries : tablets) { + for (const auto& tablet : tablets_entries) { + expected_tablets.insert(tablet.tablet_id()); + } + } + + CheckTabletsInCDCStateTable(expected_tablets, test_client(), stream_id); + + // Disable dynamic table addition on stream via the yb-admin command. + ASSERT_OK(DisableDynamicTableAdditionOnCDCSDKStream(stream_id)); + + // Remove table_1 from stream using yb-admin command. This command will remove table from stream + // metadata as well as update its corresponding state table tablet entries with checkpoint as max. + ASSERT_OK(RemoveUserTableFromCDCSDKStream(stream_id, table[0].table_id())); + SleepFor(MonoDelta::FromSeconds(5 * kTimeMultiplier)); + + // Stream metadata should no longer contain the removed table i.e. table_1. 
+ expected_tables.erase(table[0].table_id()); + std::unordered_set expected_tables_after_table_removal = expected_tables; + VerifyTablesInStreamMetadata( + stream_id, expected_tables_after_table_removal, + "Waiting for GetDBStreamInfo after table removal from CDC stream."); + + // Since checkpoint will be set to max for table_1's tablet entries, wait for + // UpdatePeersAndMetrics to delete those entries. + SleepFor(MonoDelta::FromSeconds(5 * kTimeMultiplier)); + + // Verify tablets of table_1 are removed from cdc_state table. + expected_tablets.clear(); + for (int i = 1; i < idx; i++) { + for (const auto& tablet : tablets[i]) { + expected_tablets.insert(tablet.tablet_id()); + } + } + + CheckTabletsInCDCStateTable(expected_tablets, test_client(), stream_id); + + ASSERT_OK(test_client()->FlushTables( + {table[0].table_id()}, /* add_indexes = */ false, /* timeout_secs = */ 30, + /* is_compaction = */ false)); + + // Split table_1's tablet. + WaitUntilSplitIsSuccesful(tablets[0].Get(0).tablet_id(), table[0], 2); + google::protobuf::RepeatedPtrField table1_tablets_after_split; + ASSERT_OK(test_client()->GetTablets( + table[0], 0, &table1_tablets_after_split, /* partition_list_version =*/nullptr)); + ASSERT_EQ(table1_tablets_after_split.size(), 2); + + // Wait for some time so that tablet split codepath has completed adding new cdc state entries. + SleepFor(MonoDelta::FromSeconds(3 * kTimeMultiplier)); + + // Children tablets of table_1 shouldn't get added to cdc state table since the table no longer + // exists in stream metadata. + CheckTabletsInCDCStateTable(expected_tablets, test_client(), stream_id); + + auto leader_master = ASSERT_RESULT(test_cluster_.mini_cluster_->GetLeaderMiniMaster()); + ASSERT_OK(leader_master->Restart()); + LOG(INFO) << "Master Restarted"; + + // Even after a restart, we shouldn't see table_1 in stream metadata, and cdc state table + // entries shouldn't contain any of the table_1 tablets.
+ VerifyTablesInStreamMetadata( + stream_id, expected_tables_after_table_removal, + "Waiting for GetBStreamInfo after master restart."); + + CheckTabletsInCDCStateTable(expected_tablets, test_client(), stream_id); +} + +TEST_F(CDCSDKYsqlTest, TestUserTableRemovalFromNonConsistentSnapshotCDCStream) { + TestUserTableRemovalFromCDCStream(/* use_consistent_snapshot_stream */ false); +} + +TEST_F(CDCSDKYsqlTest, TestUserTableRemovalFromConsistentSnapshotCDCStream) { + TestUserTableRemovalFromCDCStream(/* use_consistent_snapshot_stream */ true); +} + +void CDCSDKYsqlTest::TestValidationAndSyncOfCDCStateEntriesAfterUserTableRemoval( + bool use_consistent_snapshot_stream) { + ANNOTATE_UNPROTECTED_WRITE(FLAGS_yb_enable_cdc_consistent_snapshot_streams) = + use_consistent_snapshot_stream; + ANNOTATE_UNPROTECTED_WRITE(FLAGS_update_min_cdc_indices_interval_secs) = 1; + ANNOTATE_UNPROTECTED_WRITE(FLAGS_TEST_cdcsdk_skip_updating_cdc_state_entries_on_table_removal) = + true; + ANNOTATE_UNPROTECTED_WRITE(FLAGS_cdcsdk_enable_dynamic_tables_disable_option) = true; + // Setup cluster. + ASSERT_OK(SetUpWithParams(3, 3, false)); + + const vector table_list_suffix = {"_0", "_1", "_2"}; + const int kNumTables = 3; + vector table(kNumTables); + int idx = 0; + vector> tablets(kNumTables); + + // Create and populate data in the all 3 tables. + for (idx = 0; idx < kNumTables; idx++) { + table[idx] = ASSERT_RESULT(CreateTable( + &test_cluster_, kNamespaceName, kTableName, 3, true, false, 0, true, + table_list_suffix[idx])); + ASSERT_OK(test_client()->GetTablets( + table[idx], 0, &tablets[idx], /* partition_list_version = */ nullptr)); + ASSERT_OK(WriteEnumsRows( + 0 /* start */, 100 /* end */, &test_cluster_, table_list_suffix[idx], kNamespaceName, + kTableName)); + } + + auto stream_id = use_consistent_snapshot_stream + ? 
ASSERT_RESULT(CreateConsistentSnapshotStream()) + : ASSERT_RESULT(CreateDBStream(CDCCheckpointType::EXPLICIT)); + + // Before we remove a table, get the initial stream metadata as well as cdc state table entries. + std::unordered_set expected_tables; + for (const auto& table_entry : table) { + expected_tables.insert(table_entry.table_id()); + } + + VerifyTablesInStreamMetadata( + stream_id, expected_tables, "Waiting for GetDBStreamInfo after stream creation"); + + std::unordered_set expected_tablets; + for (const auto& tablets_entries : tablets) { + for (const auto& tablet : tablets_entries) { + expected_tablets.insert(tablet.tablet_id()); + } + } + + CheckTabletsInCDCStateTable(expected_tablets, test_client(), stream_id); + + // Disable dynamic table addition on stream via the yb-admin command. + ASSERT_OK(DisableDynamicTableAdditionOnCDCSDKStream(stream_id)); + + // Remove table_1 from stream using yb-admin command. This command will remove table from stream + // metadata but skip updating cdc state entries because the test flag + // TEST_cdcsdk_skip_updating_cdc_state_entries_on_table_removal is set. + ASSERT_OK(RemoveUserTableFromCDCSDKStream(stream_id, table[0].table_id())); + SleepFor(MonoDelta::FromSeconds(5 * kTimeMultiplier)); + + // Stream metadata should no longer contain the removed table i.e. table_1. + expected_tables.erase(table[0].table_id()); + std::unordered_set expected_tables_after_table_removal = expected_tables; + VerifyTablesInStreamMetadata( + stream_id, expected_tables_after_table_removal, + "Waiting for GetDBStreamInfo after table removal from CDC stream."); + + // Verify that cdc state table still contains entries for the table that was removed. + CheckTabletsInCDCStateTable(expected_tablets, test_client(), stream_id); + + // Now, validate the cdc state entries using the yb-admin command + // 'validate_and_sync_cdc_state_table_entries_on_change_data_stream'. It will find state table + // entries for table_1 and update their checkpoints to max.
+ ASSERT_OK(ValidateAndSyncCDCStateEntriesForCDCSDKStream(stream_id)); + + // Since checkpoint will be set to max for table_1's tablet entries, wait for + // UpdatePeersAndMetrics to delete those entries. + SleepFor(MonoDelta::FromSeconds(5 * kTimeMultiplier)); + + // Verify tablets of table_1 are removed from cdc_state table. + expected_tablets.clear(); + for (int i = 1; i < idx; i++) { + for (const auto& tablet : tablets[i]) { + expected_tablets.insert(tablet.tablet_id()); + } + } + + CheckTabletsInCDCStateTable(expected_tablets, test_client(), stream_id); +} + +TEST_F( + CDCSDKYsqlTest, + TestValidationAndSyncOfCDCStateEntriesAfterUserTableRemovalOnNonConsistentSnapshotStream) { + TestValidationAndSyncOfCDCStateEntriesAfterUserTableRemoval( + /* use_consistent_snapshot_stream */ false); +} + +TEST_F( + CDCSDKYsqlTest, + TestValidationAndSyncOfCDCStateEntriesAfterUserTableRemovalOnConsistentSnapshotStream) { + TestValidationAndSyncOfCDCStateEntriesAfterUserTableRemoval( + /* use_consistent_snapshot_stream */ true); +} + } // namespace cdc } // namespace yb diff --git a/src/yb/integration-tests/cdcsdk_ysql_test_base.cc b/src/yb/integration-tests/cdcsdk_ysql_test_base.cc index c71dfe216e6f..997d5af15fdf 100644 --- a/src/yb/integration-tests/cdcsdk_ysql_test_base.cc +++ b/src/yb/integration-tests/cdcsdk_ysql_test_base.cc @@ -2043,6 +2043,27 @@ namespace cdc { return get_resp; } + void CDCSDKYsqlTest::VerifyTablesInStreamMetadata( + const xrepl::StreamId& stream_id, const std::unordered_set& expected_table_ids, + const std::string& timeout_msg) { + ASSERT_OK(WaitFor( + [&]() -> Result { + auto get_resp = GetDBStreamInfo(stream_id); + if (get_resp.ok() && !get_resp->has_error()) { + const uint64_t table_info_size = get_resp->table_info_size(); + if (table_info_size == expected_table_ids.size()) { + std::unordered_set table_ids; + for (auto entry : get_resp->table_info()) { + table_ids.insert(entry.table_id()); + } + if (expected_table_ids == table_ids) return true; + 
} + } + return false; + }, + MonoDelta::FromSeconds(60), timeout_msg)); + } + Status CDCSDKYsqlTest::ChangeLeaderOfTablet(size_t new_leader_index, const TabletId tablet_id) { CHECK(!FLAGS_enable_load_balancing); @@ -3674,5 +3695,53 @@ namespace cdc { } + Status CDCSDKYsqlTest::ExecuteYBAdminCommand( + const std::string& command_name, const std::vector& command_args) { + string tool_path = GetToolPath("../bin", "yb-admin"); + vector argv; + argv.push_back(tool_path); + argv.push_back("--master_addresses"); + argv.push_back(AsString(test_cluster_.mini_cluster_->GetMasterAddresses())); + argv.push_back(command_name); + for (const auto& command_arg : command_args) { + argv.push_back(command_arg); + } + + RETURN_NOT_OK(Subprocess::Call(argv)); + + return Status::OK(); + } + + Status CDCSDKYsqlTest::DisableDynamicTableAdditionOnCDCSDKStream( + const xrepl::StreamId& stream_id) { + std::string yb_admin_command = "disable_dynamic_table_addition_on_change_data_stream"; + vector command_args; + command_args.push_back(stream_id.ToString()); + RETURN_NOT_OK(ExecuteYBAdminCommand(yb_admin_command, command_args)); + return Status::OK(); + } + + Status CDCSDKYsqlTest::RemoveUserTableFromCDCSDKStream( + const xrepl::StreamId& stream_id, const TableId& table_id) { + std::string yb_admin_command = "remove_user_table_from_change_data_stream"; + vector command_args; + command_args.push_back(stream_id.ToString()); + command_args.push_back(table_id); + RETURN_NOT_OK(ExecuteYBAdminCommand(yb_admin_command, command_args)); + + return Status::OK(); + } + + Status CDCSDKYsqlTest::ValidateAndSyncCDCStateEntriesForCDCSDKStream( + const xrepl::StreamId& stream_id) { + std::string yb_admin_command = + "validate_and_sync_cdc_state_table_entries_on_change_data_stream"; + vector command_args; + command_args.push_back(stream_id.ToString()); + RETURN_NOT_OK(ExecuteYBAdminCommand(yb_admin_command, command_args)); + + return Status::OK(); + } + } // namespace cdc } // namespace yb diff --git 
a/src/yb/integration-tests/cdcsdk_ysql_test_base.h b/src/yb/integration-tests/cdcsdk_ysql_test_base.h index 2f7c87c2e2cc..148efa1606a8 100644 --- a/src/yb/integration-tests/cdcsdk_ysql_test_base.h +++ b/src/yb/integration-tests/cdcsdk_ysql_test_base.h @@ -135,6 +135,8 @@ DECLARE_bool(enable_log_retention_by_op_idx); DECLARE_bool(yb_enable_cdc_consistent_snapshot_streams); DECLARE_uint32(cdcsdk_tablet_not_of_interest_timeout_secs); DECLARE_uint32(cdcsdk_retention_barrier_no_revision_interval_secs); +DECLARE_bool(cdcsdk_enable_dynamic_tables_disable_option); +DECLARE_bool(TEST_cdcsdk_skip_updating_cdc_state_entries_on_table_removal); namespace yb { @@ -495,6 +497,10 @@ class CDCSDKYsqlTest : public CDCSDKTestBase { Result GetDBStreamInfo(const xrepl::StreamId db_stream_id); + void VerifyTablesInStreamMetadata( + const xrepl::StreamId& stream_id, const std::unordered_set& expected_table_ids, + const std::string& timeout_msg); + Status ChangeLeaderOfTablet(size_t new_leader_index, const TabletId tablet_id); Status CreateSnapshot(const NamespaceName& ns); @@ -643,6 +649,22 @@ class CDCSDKYsqlTest : public CDCSDKTestBase { CDCSDKCheckpointPB checkpoint, GetChangesResponsePB* change_resp); void TestNonUserTableShouldNotGetAddedToCDCStream (bool create_consistent_snapshot_stream); + + Status ExecuteYBAdminCommand( + const std::string& command_name, const std::vector& command_args); + + Status DisableDynamicTableAdditionOnCDCSDKStream(const xrepl::StreamId& stream_id); + + void TestDisableOfDynamicTableAdditionOnCDCStream(bool use_consistent_snapshot_stream); + + Status RemoveUserTableFromCDCSDKStream(const xrepl::StreamId& stream_id, const TableId& table_id); + + void TestUserTableRemovalFromCDCStream(bool use_consistent_snapshot_stream); + + Status ValidateAndSyncCDCStateEntriesForCDCSDKStream(const xrepl::StreamId& stream_id); + + void TestValidationAndSyncOfCDCStateEntriesAfterUserTableRemoval( + bool use_consistent_snapshot_stream); }; } // namespace cdc diff --git 
a/src/yb/master/catalog_entity_info.cc b/src/yb/master/catalog_entity_info.cc index fccad8905341..bc490e87e5ce 100644 --- a/src/yb/master/catalog_entity_info.cc +++ b/src/yb/master/catalog_entity_info.cc @@ -59,6 +59,7 @@ using std::string; using strings::Substitute; DECLARE_int32(tserver_unresponsive_timeout_ms); +DECLARE_bool(cdcsdk_enable_dynamic_tables_disable_option); DEFINE_RUNTIME_AUTO_bool( use_parent_table_id_field, kLocalPersisted, false, true, @@ -1282,6 +1283,11 @@ const NamespaceId CDCStreamInfo::namespace_id() const { return LockForRead()->pb.namespace_id(); } +bool CDCStreamInfo::IsCDCSDKStream() const { + auto l = LockForRead(); + return l->pb.has_namespace_id() && !l->pb.namespace_id().empty(); +} + const ReplicationSlotName CDCStreamInfo::GetCdcsdkYsqlReplicationSlotName() const { auto l = LockForRead(); return ReplicationSlotName(l->pb.cdcsdk_ysql_replication_slot_name()); @@ -1293,6 +1299,16 @@ bool CDCStreamInfo::IsConsistentSnapshotStream() const { l->pb.cdcsdk_stream_metadata().has_consistent_snapshot_option(); } +bool CDCStreamInfo::IsDynamicTableAdditionDisabled() const { + if (!FLAGS_cdcsdk_enable_dynamic_tables_disable_option) { + return false; + } + + auto l = LockForRead(); + return l->pb.has_cdcsdk_disable_dynamic_table_addition() && + l->pb.cdcsdk_disable_dynamic_table_addition(); +} + std::string CDCStreamInfo::ToString() const { auto l = LockForRead(); if (l->pb.has_namespace_id()) { diff --git a/src/yb/master/catalog_entity_info.h b/src/yb/master/catalog_entity_info.h index 03aefb35f834..2655438f79d4 100644 --- a/src/yb/master/catalog_entity_info.h +++ b/src/yb/master/catalog_entity_info.h @@ -1258,6 +1258,10 @@ class CDCStreamInfo : public RefCountedThreadSafe, bool IsConsistentSnapshotStream() const; + bool IsCDCSDKStream() const; + + bool IsDynamicTableAdditionDisabled() const; + std::string ToString() const override; private: diff --git a/src/yb/master/catalog_entity_info.proto b/src/yb/master/catalog_entity_info.proto index 
4783cbfdff69..af4db43db75c 100644 --- a/src/yb/master/catalog_entity_info.proto +++ b/src/yb/master/catalog_entity_info.proto @@ -519,6 +519,11 @@ message SysCDCStreamEntryPB { optional string cdcsdk_ysql_replication_slot_name = 6; optional CDCSDKStreamEntryPB cdcsdk_stream_metadata = 7; optional uint64 stream_creation_time = 8; + + // Dynamic tables are the tables which are created after the creation of the stream. + // This field controls if dynamic tables should automatically be added to the CDC stream or not. + // If set to true, dynamic tables won't get added to the CDC stream. + optional bool cdcsdk_disable_dynamic_table_addition = 11; } diff --git a/src/yb/master/catalog_manager.h b/src/yb/master/catalog_manager.h index b9cf2d7520c7..ecff1f341d93 100644 --- a/src/yb/master/catalog_manager.h +++ b/src/yb/master/catalog_manager.h @@ -44,6 +44,7 @@ #include #include +#include "yb/cdc/cdc_state_table.h" #include "yb/cdc/xcluster_types.h" #include "yb/common/constants.h" #include "yb/common/entity_ids.h" @@ -1311,6 +1312,18 @@ class CatalogManager : public tserver::TabletPeerLookupIf, Status UpdateCDCStream( const UpdateCDCStreamRequestPB* req, UpdateCDCStreamResponsePB* resp, rpc::RpcContext* rpc); + Status DisableDynamicTableAdditionOnCDCSDKStream( + const DisableDynamicTableAdditionOnCDCSDKStreamRequestPB* req, + DisableDynamicTableAdditionOnCDCSDKStreamResponsePB* resp, rpc::RpcContext* rpc); + + Status RemoveUserTableFromCDCSDKStream( + const RemoveUserTableFromCDCSDKStreamRequestPB* req, + RemoveUserTableFromCDCSDKStreamResponsePB* resp, rpc::RpcContext* rpc); + + Status ValidateAndSyncCDCStateEntriesForCDCSDKStream( + const ValidateAndSyncCDCStateEntriesForCDCSDKStreamRequestPB* req, + ValidateAndSyncCDCStateEntriesForCDCSDKStreamResponsePB* resp, rpc::RpcContext* rpc); + // Query if Bootstrapping is required for a CDC stream (e.g. Are we missing logs).
Status IsBootstrapRequired( const IsBootstrapRequiredRequestPB* req, @@ -1439,7 +1452,7 @@ class CatalogManager : public tserver::TabletPeerLookupIf, // Find all CDCSDK streams which do not have metadata for the newly added tables. Status FindCDCSDKStreamsForAddedTables(TableStreamIdsMap* table_to_unprocessed_streams_map); - bool CanTableBeAddedToCDCSDKStream( + bool IsTableEligibleForCDCSDKStream( const TableInfoPtr& table_info, const Schema& schema) const REQUIRES_SHARED(mutex_); // This method compares all tables in the namespace to all the tables added to a CDCSDK stream, @@ -3103,6 +3116,14 @@ class CatalogManager : public tserver::TabletPeerLookupIf, void ValidateIndexTablesPostLoad(std::unordered_map&& indexes_map, TableIdSet* tables_to_persist) EXCLUDES(mutex_); + Result> UpdateCheckpointForTabletEntriesInCDCState( + const xrepl::StreamId& stream_id, + const std::unordered_set& tables_in_stream_metadata, + const TableId& table_to_be_removed = ""); + + Status RemoveTableFromCDCStreamMetadataAndMaps( + const CDCStreamInfoPtr stream, const TableId table_id); + // Should be bumped up when tablet locations are changed. std::atomic tablet_locations_version_{0}; diff --git a/src/yb/master/master_replication.proto b/src/yb/master/master_replication.proto index bd9347f747d9..8fa75e49061a 100644 --- a/src/yb/master/master_replication.proto +++ b/src/yb/master/master_replication.proto @@ -36,6 +36,11 @@ message CDCStreamInfoPB { optional uint64 cdcsdk_consistent_snapshot_time = 7; optional CDCSDKSnapshotOption cdcsdk_consistent_snapshot_option = 8; optional uint64 stream_creation_time = 9; + + // Dynamic tables are the tables which are created after the creation of the stream. + // This field controls if dynamic tables should automatically be added to the CDC stream or not. + // If set to true, dynamic tables won't get added to the CDC stream.
+ optional bool cdcsdk_disable_dynamic_table_addition = 12; } message ValidateReplicationInfoRequestPB { @@ -498,6 +503,32 @@ message XClusterReportNewAutoFlagConfigVersionResponsePB { optional MasterErrorPB error = 1; } +message DisableDynamicTableAdditionOnCDCSDKStreamRequestPB { + optional string stream_id = 1; +} + +message DisableDynamicTableAdditionOnCDCSDKStreamResponsePB { + optional MasterErrorPB error = 1; +} + +message RemoveUserTableFromCDCSDKStreamRequestPB { + optional string stream_id = 1; + optional string table_id = 2; +} + +message RemoveUserTableFromCDCSDKStreamResponsePB { + optional MasterErrorPB error = 1; +} + +message ValidateAndSyncCDCStateEntriesForCDCSDKStreamRequestPB { + optional string stream_id = 1; +} + +message ValidateAndSyncCDCStateEntriesForCDCSDKStreamResponsePB { + optional MasterErrorPB error = 1; + repeated string updated_tablet_entries = 2; +} + service MasterReplication { option (yb.rpc.custom_service_name) = "yb.master.MasterService"; @@ -563,4 +594,15 @@ service MasterReplication { rpc XClusterReportNewAutoFlagConfigVersion( XClusterReportNewAutoFlagConfigVersionRequestPB) returns (XClusterReportNewAutoFlagConfigVersionResponsePB); + + // Introduced for bug (#22876, #22773) + rpc DisableDynamicTableAdditionOnCDCSDKStream (DisableDynamicTableAdditionOnCDCSDKStreamRequestPB) + returns (DisableDynamicTableAdditionOnCDCSDKStreamResponsePB); + // Introduced for bug (#22876, #22773) + rpc RemoveUserTableFromCDCSDKStream (RemoveUserTableFromCDCSDKStreamRequestPB) + returns (RemoveUserTableFromCDCSDKStreamResponsePB); + // Introduced for bug (#22876, #22773) + rpc ValidateAndSyncCDCStateEntriesForCDCSDKStream( + ValidateAndSyncCDCStateEntriesForCDCSDKStreamRequestPB) + returns (ValidateAndSyncCDCStateEntriesForCDCSDKStreamResponsePB); } diff --git a/src/yb/master/master_replication_service.cc b/src/yb/master/master_replication_service.cc index b152f6c9149c..f3bcc73cc929 100644 --- a/src/yb/master/master_replication_service.cc +++ 
b/src/yb/master/master_replication_service.cc @@ -56,6 +56,9 @@ class MasterReplicationServiceImpl : public MasterServiceBase, public MasterRepl (GetTableSchemaFromSysCatalog) (ChangeXClusterRole) (BootstrapProducer) + (DisableDynamicTableAdditionOnCDCSDKStream) + (RemoveUserTableFromCDCSDKStream) + (ValidateAndSyncCDCStateEntriesForCDCSDKStream) ) MASTER_SERVICE_IMPL_ON_LEADER_WITH_LOCK( diff --git a/src/yb/master/xrepl_catalog_manager.cc b/src/yb/master/xrepl_catalog_manager.cc index 5378f2307ba9..2acfec7b82b1 100644 --- a/src/yb/master/xrepl_catalog_manager.cc +++ b/src/yb/master/xrepl_catalog_manager.cc @@ -135,6 +135,22 @@ DEFINE_test_flag(bool, fail_universe_replication_merge, false, "Causes MergeUniv DEFINE_test_flag(bool, xcluster_fail_setup_stream_update, false, "Fail UpdateCDCStream RPC call"); +DEFINE_RUNTIME_AUTO_bool(cdcsdk_enable_dynamic_tables_disable_option, + kLocalPersisted, + false, + true, + "This flag needs to be true in order to disable addition of dynamic tables " + "to CDC stream. This flag is required to be to true for execution of " + "yb-admin commands - " + "\'disable_dynamic_table_addition_on_change_data_stream\', " + "\'remove_user_table_from_change_data_stream\'"); +TAG_FLAG(cdcsdk_enable_dynamic_tables_disable_option, advanced); +TAG_FLAG(cdcsdk_enable_dynamic_tables_disable_option, hidden); + +DEFINE_test_flag(bool, cdcsdk_skip_updating_cdc_state_entries_on_table_removal, false, + "Skip updating checkpoint to max for cdc state table entries while removing a user table from " + "CDCSDK stream."); + DECLARE_bool(xcluster_wait_on_ddl_alter); DECLARE_int32(master_rpc_timeout_ms); DECLARE_bool(enable_xcluster_auto_flag_validation); @@ -1543,6 +1559,11 @@ Status CatalogManager::FindCDCSDKStreamsForAddedTables( continue; } + // skip streams on which dynamic table addition is disabled. 
+ if(stream_info->IsDynamicTableAdditionDisabled()) { + continue; + } + auto const unprocessed_tables = FindOrNull(namespace_to_unprocessed_table_map, stream_info->namespace_id()); if (!unprocessed_tables) { @@ -1565,7 +1586,7 @@ Status CatalogManager::FindCDCSDKStreamsForAddedTables( continue; } - if (!CanTableBeAddedToCDCSDKStream(table, schema)) { + if (!IsTableEligibleForCDCSDKStream(table, schema)) { RemoveTableFromCDCSDKUnprocessedMap(unprocessed_table_id, stream_info->namespace_id()); continue; } @@ -1660,7 +1681,7 @@ std::vector CatalogManager::FindAllTablesForCDCSDK(const Namespace } } - if (!CanTableBeAddedToCDCSDKStream(table_info.get(), schema)) { + if (!IsTableEligibleForCDCSDKStream(table_info.get(), schema)) { continue; } @@ -1670,7 +1691,7 @@ std::vector CatalogManager::FindAllTablesForCDCSDK(const Namespace return tables; } -bool CatalogManager::CanTableBeAddedToCDCSDKStream( +bool CatalogManager::IsTableEligibleForCDCSDKStream( const TableInfoPtr& table_info, const Schema& schema) const { bool has_pk = true; for (const auto& col : schema.columns()) { @@ -2212,6 +2233,12 @@ Status CatalogManager::GetCDCStream( stream_info->set_stream_creation_time(stream_lock->pb.stream_creation_time()); } + if (FLAGS_cdcsdk_enable_dynamic_tables_disable_option && + stream_lock->pb.has_cdcsdk_disable_dynamic_table_addition()) { + stream_info->set_cdcsdk_disable_dynamic_table_addition( + stream_lock->pb.cdcsdk_disable_dynamic_table_addition()); + } + return Status::OK(); } @@ -2337,6 +2364,11 @@ Status CatalogManager::ListCDCStreams( stream->set_stream_creation_time(ltm->pb.stream_creation_time()); } + if (FLAGS_cdcsdk_enable_dynamic_tables_disable_option && + ltm->pb.has_cdcsdk_disable_dynamic_table_addition()) { + stream->set_cdcsdk_disable_dynamic_table_addition( + ltm->pb.cdcsdk_disable_dynamic_table_addition()); + } } return Status::OK(); } @@ -5867,6 +5899,232 @@ Status CatalogManager::GetReplicationStatus( return Status::OK(); } + +Status 
CatalogManager::DisableDynamicTableAdditionOnCDCSDKStream( + const DisableDynamicTableAdditionOnCDCSDKStreamRequestPB* req, + DisableDynamicTableAdditionOnCDCSDKStreamResponsePB* resp, rpc::RpcContext* rpc) { + LOG(INFO) << "Servicing DisableDynamicTableAdditionOnCDCSDKStream request from " + << RequestorString(rpc) << ": " << req->ShortDebugString(); + + if (!req->has_stream_id()) { + RETURN_INVALID_REQUEST_STATUS("CDC Stream ID must be provided", (*req)); + } + + if (!FLAGS_cdcsdk_enable_dynamic_tables_disable_option) { + RETURN_INVALID_REQUEST_STATUS( + "Disabling addition of dynamic tables to CDC stream is disallowed in the middle of an " + "upgrade. Finalize the upgrade and try again", (*req)); + } + + auto stream_id = VERIFY_RESULT(xrepl::StreamId::FromString(req->stream_id())); + + CDCStreamInfoPtr stream; + { + SharedLock lock(mutex_); + stream = FindPtrOrNull(cdc_stream_map_, stream_id); + } + + if (stream == nullptr || stream->LockForRead()->is_deleting()) { + return STATUS( + NotFound, "Could not find CDC stream", MasterError(MasterErrorPB::OBJECT_NOT_FOUND)); + } + + if (!stream->IsCDCSDKStream()) { + RETURN_INVALID_REQUEST_STATUS("Not a CDC stream", (*req)); + } + + // We only want to allow disabling dynamic table addition on older streams that are not associated + // with a replication slot. + if (!stream->GetCdcsdkYsqlReplicationSlotName().empty()) { + RETURN_INVALID_REQUEST_STATUS( + "Cannot disable dynamic table addition on CDC streams associated with a replication slot", + (*req)); + } + + if (stream->IsDynamicTableAdditionDisabled()) { + return STATUS(AlreadyPresent, "Dynamic table addition already disabled on the CDC stream"); + } + + // Disable dynamic table addition by setting the stream metadata field to true. 
+ { + auto stream_lock = stream->LockForWrite(); + auto& pb = stream_lock.mutable_data()->pb; + + pb.set_cdcsdk_disable_dynamic_table_addition(true); + + RETURN_ACTION_NOT_OK( + sys_catalog_->Upsert(leader_ready_term(), stream), "Updating CDC stream in system catalog"); + + stream_lock.Commit(); + } + + LOG_WITH_FUNC(INFO) << "Successfully disabled dynamic table addition on CDC stream: " + << stream_id; + + return Status::OK(); +} + +Status CatalogManager::RemoveUserTableFromCDCSDKStream( + const RemoveUserTableFromCDCSDKStreamRequestPB* req, + RemoveUserTableFromCDCSDKStreamResponsePB* resp, rpc::RpcContext* rpc) { + LOG(INFO) << "Servicing RemoveUserTableFromCDCSDKStream request from " << RequestorString(rpc) + << ": " << req->ShortDebugString(); + + if (!req->has_stream_id() || !req->has_table_id()) { + RETURN_INVALID_REQUEST_STATUS("Both CDC Stream ID and table ID must be provided", (*req)); + } + + if (!FLAGS_cdcsdk_enable_dynamic_tables_disable_option) { + RETURN_INVALID_REQUEST_STATUS( + "Removal of user table from CDC stream is disallowed in the middle of an " + "upgrade. 
Finalize the upgrade and try again", (*req)); + } + + auto stream_id = VERIFY_RESULT(xrepl::StreamId::FromString(req->stream_id())); + auto table_id = req->table_id(); + + CDCStreamInfoPtr stream; + { + SharedLock lock(mutex_); + stream = FindPtrOrNull(cdc_stream_map_, stream_id); + } + + if (stream == nullptr || stream->LockForRead()->is_deleting()) { + return STATUS( + NotFound, "Could not find CDC stream", MasterError(MasterErrorPB::OBJECT_NOT_FOUND)); + } + + if (!stream->IsCDCSDKStream()) { + RETURN_INVALID_REQUEST_STATUS("Not a CDC stream", (*req)); + } + + if (!stream->GetCdcsdkYsqlReplicationSlotName().empty()) { + RETURN_INVALID_REQUEST_STATUS( + "Cannot remove table from CDC streams that are associated with a replication slot", (*req)); + } + + if (!stream->IsDynamicTableAdditionDisabled()) { + RETURN_INVALID_REQUEST_STATUS( + "Cannot remove table unless dynamic table addition is disabled for the stream. Please use " + "the yb-admin command \"disable_dynamic_table_addition_in_change_data_stream\" to disable " + "dynamic table addition on the stream.", (*req)); + } + + auto stream_ns_id = stream->LockForRead()->namespace_id(); + + scoped_refptr table; + { + SharedLock lock(mutex_); + table = tables_->FindTableOrNull(table_id); + } + + if (table == nullptr || table->LockForRead()->is_deleting()) { + return STATUS(NotFound, "Could not find table", MasterError(MasterErrorPB::OBJECT_NOT_FOUND)); + } + + Schema schema; + Status status = table->GetSchema(&schema); + if (!status.ok()) { + return STATUS(InternalError, Format("Error while getting schema for table: $0", table->name())); + } + + { + SharedLock lock(mutex_); + if (!IsTableEligibleForCDCSDKStream(table, schema)) { + RETURN_INVALID_REQUEST_STATUS( + "Only allowed to remove user tables from CDC streams via this command.", (*req)); + } + } + + auto table_ns_id = table->LockForRead()->namespace_id(); + if (table_ns_id != stream_ns_id) { + RETURN_INVALID_REQUEST_STATUS("Stream and Table are not under the 
same namespace", (*req)); + } + + if (!FLAGS_TEST_cdcsdk_skip_updating_cdc_state_entries_on_table_removal) { + std::unordered_set tables_in_stream_metadata; + { + auto stream_lock = stream->LockForRead(); + for (const auto& table_id : stream_lock->table_id()) { + tables_in_stream_metadata.insert(table_id); + } + } + + // Explicitly remove the table from the set since we want to remove the tablet entries of this + // table from the cdc state table. + tables_in_stream_metadata.erase(table_id); + RETURN_NOT_OK_PREPEND( + UpdateCheckpointForTabletEntriesInCDCState(stream_id, tables_in_stream_metadata), + "Error updating tablet entries from cdc state table"); + } + + // Now remove the table from the CDC stream metadata & cdcsdk_tables_to_stream_map_ and persist + // the updated metadata. + RETURN_NOT_OK_PREPEND( + RemoveTableFromCDCStreamMetadataAndMaps(stream, table_id), + "Error removing table from stream metadata and maps"); + + LOG_WITH_FUNC(INFO) + << "Successfully removed table " << table_id << " from CDC stream: " << stream_id + << " and updated the checkpoint to max for corresponding cdc state table entries."; + + return Status::OK(); +} + +Status CatalogManager::ValidateAndSyncCDCStateEntriesForCDCSDKStream( + const ValidateAndSyncCDCStateEntriesForCDCSDKStreamRequestPB* req, + ValidateAndSyncCDCStateEntriesForCDCSDKStreamResponsePB* resp, rpc::RpcContext* rpc) { + LOG(INFO) << "Servicing ValidateAndSyncCDCStateEntriesForCDCSDKStream request from " + << RequestorString(rpc) << ": " << req->ShortDebugString(); + + if (!req->has_stream_id()) { + RETURN_INVALID_REQUEST_STATUS("CDC Stream ID must be provided", (*req)); + } + + auto stream_id = VERIFY_RESULT(xrepl::StreamId::FromString(req->stream_id())); + CDCStreamInfoPtr stream; + { + SharedLock lock(mutex_); + stream = FindPtrOrNull(cdc_stream_map_, stream_id); + } + + if (stream == nullptr || stream->LockForRead()->is_deleting()) { + return STATUS( + NotFound, "Could not find CDC stream", 
MasterError(MasterErrorPB::OBJECT_NOT_FOUND)); + } + + if (!stream->IsCDCSDKStream()) { + RETURN_INVALID_REQUEST_STATUS("Not a CDC stream", (*req)); + } + + if (!stream->GetCdcsdkYsqlReplicationSlotName().empty()) { + RETURN_INVALID_REQUEST_STATUS( + "Cannot validate and sync cdc state table entries for CDC streams that are associated with " + "a replication slot", (*req)); + } + + std::unordered_set tables_in_stream_metadata; + { + auto stream_lock = stream->LockForRead(); + tables_in_stream_metadata.reserve(stream_lock->table_id().size()); + for (const auto& table_id : stream_lock->table_id()) { + tables_in_stream_metadata.insert(table_id); + } + } + + auto updated_state_table_entries = VERIFY_RESULT( + UpdateCheckpointForTabletEntriesInCDCState(stream_id, tables_in_stream_metadata)); + + for (const auto& entry : updated_state_table_entries) { + resp->add_updated_tablet_entries(entry.key.tablet_id); + } + + LOG_WITH_FUNC(INFO) + << "Successfully validated and synced cdc state table entries for CDC stream: " << stream_id; + + return Status::OK(); +} + Status CatalogManager::TEST_CDCSDKFailCreateStreamRequestIfNeeded(const std::string& sync_point) { bool fail_create_cdc_stream_request = false; TEST_SYNC_POINT_CALLBACK(sync_point, &fail_create_cdc_stream_request); @@ -7432,5 +7690,123 @@ Status CatalogManager::XClusterRefreshLocalAutoFlagConfig(const LeaderEpoch& epo return Status::OK(); } +Result> +CatalogManager::UpdateCheckpointForTabletEntriesInCDCState( + const xrepl::StreamId& stream_id, const std::unordered_set& tables_in_stream_metadata, + const TableId& table_to_be_removed) { + std::unordered_set tablet_entries_to_be_removed; + + // If the table_id to be removed is provided, we will only find out cdc state table entries + // corresponding to this table and update their checkpoints. Otherwise, we'll consider all state + // table entries for checkpoint update. 
+ if (!table_to_be_removed.empty()) { + scoped_refptr table; + { + SharedLock lock(mutex_); + table = tables_->FindTableOrNull(table_to_be_removed); + } + + // First we'll update the checkpoint to OpId max for all the cdc state entries correponding to + // the table. Therefore, get all the tablets for the table to be removed. + TabletInfos tablets; + tablets = table->GetTablets(IncludeInactive::kTrue); + + for (const auto& tablet : tablets) { + tablet_entries_to_be_removed.insert(tablet->tablet_id()); + } + } + + Status iteration_status; + auto all_entry_keys = + VERIFY_RESULT(cdc_state_table_->GetTableRange({} /* just key columns */, &iteration_status)); + std::vector entries_to_update; + // Get all the tablet, stream pairs from cdc_state for the given stream. + std::vector cdc_state_tablet_entries; + for (const auto& entry_result : all_entry_keys) { + RETURN_NOT_OK(entry_result); + const auto& entry = *entry_result; + + if (entry.key.stream_id == stream_id) { + // If table_id is provided, filter out state entries belonging to tablets of the table. + if (table_to_be_removed.empty() || + (!table_to_be_removed.empty() && + tablet_entries_to_be_removed.contains(entry.key.tablet_id))) { + cdc_state_tablet_entries.push_back(entry.key.tablet_id); + } + } + } + RETURN_NOT_OK(iteration_status); + + // Get the tablet info for state table entries of the stream. + auto tablet_infos = GetTabletInfos(cdc_state_tablet_entries); + + // For each state table entry present in cdc_state_tablet_entries, verify that the tablet's table + // is present in the CDC stream metadata. If not, update checkpoint of such tablet entries to + // OpId::Max. For colocated tables, even if one of the colocated table is present in the CDC + // stream metadata, skip updating the checkpoint for that tablet, stream pair. 
+ for (const auto& tablet_info : tablet_infos) { + bool table_found = false; + for (const auto& table_id : tablet_info->GetTableIds()) { + if (tables_in_stream_metadata.contains(table_id)) { + table_found = true; + } + } + + if (!table_found) { + cdc::CDCStateTableEntry update_entry(tablet_info->tablet_id(), stream_id); + update_entry.checkpoint = OpId::Max(); + entries_to_update.emplace_back(std::move(update_entry)); + LOG_WITH_FUNC(INFO) + << "Setting checkpoint to OpId::Max() for cdc state table entry (tablet,stream) - " + << update_entry.ToString(); + } + } + + if (!entries_to_update.empty()) { + LOG_WITH_FUNC(INFO) + << "Updating checkpoint to max for " << entries_to_update.size() + << " cdc state entries as part of validating cdc state table entries for CDC stream: " + << stream_id; + RETURN_NOT_OK_PREPEND( + cdc_state_table_->UpdateEntries(entries_to_update), + "Error setting checkpoint to OpId::Max() in cdc_state table"); + } + + return entries_to_update; +} + +Status CatalogManager::RemoveTableFromCDCStreamMetadataAndMaps( + const CDCStreamInfoPtr stream, const TableId table_id) { + // Remove the table from the CDC stream metadata & cdcsdk_tables_to_stream_map_ and persist + // the updated metadata. 
+ { + auto ltm = stream->LockForWrite(); + bool need_to_update_stream = false; + + auto table_id_iter = std::find(ltm->table_id().begin(), ltm->table_id().end(), table_id); + if (table_id_iter != ltm->table_id().end()) { + need_to_update_stream = true; + ltm.mutable_data()->pb.mutable_table_id()->erase(table_id_iter); + } + + if (need_to_update_stream) { + RETURN_ACTION_NOT_OK( + sys_catalog_->Upsert(leader_ready_term(), stream), + "Updating CDC streams in system catalog"); + } + + ltm.Commit(); + + if (need_to_update_stream) { + { + LockGuard lock(mutex_); + cdcsdk_tables_to_stream_map_[table_id].erase(stream->StreamId()); + } + } + } + + return Status::OK(); +} + } // namespace master } // namespace yb diff --git a/src/yb/tools/yb-admin_cli.cc b/src/yb/tools/yb-admin_cli.cc index e6e4d16c651c..53cceb4d2ffc 100644 --- a/src/yb/tools/yb-admin_cli.cc +++ b/src/yb/tools/yb-admin_cli.cc @@ -1846,6 +1846,50 @@ Status get_change_data_stream_info_action( return Status::OK(); } +const auto disable_dynamic_table_addition_on_change_data_stream_args = ""; +Status disable_dynamic_table_addition_on_change_data_stream_action( + const ClusterAdminCli::CLIArguments& args, ClusterAdminClient* client) { + if (args.size() != 1) { + return ClusterAdminCli::kInvalidArguments; + } + + const string stream_id = args[0]; + string msg = Format("Failed to disable dynamic table addition on CDC stream $0", stream_id); + + RETURN_NOT_OK_PREPEND(client->DisableDynamicTableAdditionOnCDCSDKStream(stream_id), msg); + return Status::OK(); +} + +const auto remove_user_table_from_change_data_stream_args = " "; +Status remove_user_table_from_change_data_stream_action( + const ClusterAdminCli::CLIArguments& args, ClusterAdminClient* client) { + if (args.size() != 2) { + return ClusterAdminCli::kInvalidArguments; + } + + const string stream_id = args[0]; + const string table_id = args[1]; + string msg = Format("Failed to remove table $0 from CDC stream $1", table_id, stream_id); + + 
RETURN_NOT_OK_PREPEND(client->RemoveUserTableFromCDCSDKStream(stream_id, table_id), msg); + return Status::OK(); +} + +const auto validate_and_sync_cdc_state_table_entries_on_change_data_stream_args = ""; +Status validate_and_sync_cdc_state_table_entries_on_change_data_stream_action( + const ClusterAdminCli::CLIArguments& args, ClusterAdminClient* client) { + if (args.size() != 1) { + return ClusterAdminCli::kInvalidArguments; + } + + const string stream_id = args[0]; + string msg = + Format("Failed to validate and sync cdc state table entries for CDC stream $0", stream_id); + + RETURN_NOT_OK_PREPEND(client->ValidateAndSyncCDCStateEntriesForCDCSDKStream(stream_id), msg); + return Status::OK(); +} + const auto setup_universe_replication_args = " " " [] " @@ -2251,6 +2295,9 @@ void ClusterAdminCli::RegisterCommandHandlers() { REGISTER_COMMAND(list_cdc_streams); REGISTER_COMMAND(list_change_data_streams); REGISTER_COMMAND(get_change_data_stream_info); + REGISTER_COMMAND(disable_dynamic_table_addition_on_change_data_stream); + REGISTER_COMMAND(remove_user_table_from_change_data_stream); + REGISTER_COMMAND(validate_and_sync_cdc_state_table_entries_on_change_data_stream); REGISTER_COMMAND(setup_universe_replication); REGISTER_COMMAND(delete_universe_replication); REGISTER_COMMAND(alter_universe_replication); diff --git a/src/yb/tools/yb-admin_client.cc b/src/yb/tools/yb-admin_client.cc index 158b5f557c4a..acc56476fe99 100644 --- a/src/yb/tools/yb-admin_client.cc +++ b/src/yb/tools/yb-admin_client.cc @@ -3915,6 +3915,84 @@ Status ClusterAdminClient::GetCDCDBStreamInfo(const std::string& db_stream_id) { return Status::OK(); } +Status ClusterAdminClient::DisableDynamicTableAdditionOnCDCSDKStream(const std::string& stream_id) { + master::DisableDynamicTableAdditionOnCDCSDKStreamRequestPB req; + master::DisableDynamicTableAdditionOnCDCSDKStreamResponsePB resp; + + req.set_stream_id(stream_id); + + RpcController rpc; + rpc.set_timeout(timeout_); + RETURN_NOT_OK( + 
master_replication_proxy_->DisableDynamicTableAdditionOnCDCSDKStream(req, &resp, &rpc)); + + if (resp.has_error()) { + cout << "Error disabling dynamic table addition from CDC stream: " + << resp.error().status().message() << endl; + return StatusFromPB(resp.error().status()); + } + + cout << "Successfully disabled dynamic table addition on CDC stream: " << stream_id << "\n"; + + return Status::OK(); +} + +Status ClusterAdminClient::RemoveUserTableFromCDCSDKStream( + const std::string& stream_id, const std::string& table_id) { + master::RemoveUserTableFromCDCSDKStreamRequestPB req; + master::RemoveUserTableFromCDCSDKStreamResponsePB resp; + + req.set_stream_id(stream_id); + req.set_table_id(table_id); + + RpcController rpc; + // Use a timeout of at least 120 seconds since this RPC verifies that each cdc state table entry + // for the stream belongs to one of the tables in the stream metadata. + rpc.set_timeout(MonoDelta::FromSeconds(std::max(timeout_.ToSeconds(), 120.0))); + RETURN_NOT_OK(master_replication_proxy_->RemoveUserTableFromCDCSDKStream(req, &resp, &rpc)); + + if (resp.has_error()) { + cout << "Error removing user table from CDC stream: " << resp.error().status().message() + << endl; + return StatusFromPB(resp.error().status()); + } + + cout << "Successfully removed user table: " << table_id << " from CDC stream: " << stream_id + << "\n"; + + return Status::OK(); +} + +Status ClusterAdminClient::ValidateAndSyncCDCStateEntriesForCDCSDKStream( + const std::string& stream_id) { + master::ValidateAndSyncCDCStateEntriesForCDCSDKStreamRequestPB req; + master::ValidateAndSyncCDCStateEntriesForCDCSDKStreamResponsePB resp; + + req.set_stream_id(stream_id); + + RpcController rpc; + rpc.set_timeout(timeout_); + RETURN_NOT_OK( + master_replication_proxy_->ValidateAndSyncCDCStateEntriesForCDCSDKStream(req, &resp, &rpc)); + + if (resp.has_error()) { + cout << "Error validating CDC state table entries on CDC stream: " + << resp.error().status().message() << endl; + return
StatusFromPB(resp.error().status()); + } + + cout << "Successfully validated and synced CDC state table entries on CDC stream: " << stream_id + << "\n"; + if (resp.updated_tablet_entries().size() > 0) { + cout << "Updated checkpoint for the stream's cdc state table entries for following tablet_ids: " + << AsString(resp.updated_tablet_entries()) << "\n"; + } else { + cout << "No additional entries found in cdc state table that requires update. \n"; + } + + return Status::OK(); +} + Status ClusterAdminClient::WaitForSetupUniverseReplicationToFinish( const string& replication_group_id) { master::IsSetupUniverseReplicationDoneRequestPB req; diff --git a/src/yb/tools/yb-admin_client.h b/src/yb/tools/yb-admin_client.h index e5f9cce51956..0f63f621a829 100644 --- a/src/yb/tools/yb-admin_client.h +++ b/src/yb/tools/yb-admin_client.h @@ -400,6 +400,12 @@ class ClusterAdminClient { Status GetCDCDBStreamInfo(const std::string& db_stream_id); + Status DisableDynamicTableAdditionOnCDCSDKStream(const std::string& stream_id); + + Status RemoveUserTableFromCDCSDKStream(const std::string& stream_id, const std::string& table_id); + + Status ValidateAndSyncCDCStateEntriesForCDCSDKStream(const std::string& stream_id); + Status SetupNamespaceReplicationWithBootstrap(const std::string& replication_id, const std::vector& producer_addresses, const TypedNamespaceName& ns,