diff --git a/utilities/backupable/backupable_db.cc b/utilities/backupable/backupable_db.cc index 6a2f11cfb80..ab640ed4586 100644 --- a/utilities/backupable/backupable_db.cc +++ b/utilities/backupable/backupable_db.cc @@ -634,8 +634,9 @@ Status BackupEngineImpl::CreateNewBackup(DB* db, bool flush_before_backup) { Log(options_.info_log, "Backup failed -- %s", s.ToString().c_str()); Log(options_.info_log, "Backup Statistics %s\n", backup_statistics_.ToString().c_str()); - backups_.erase(new_backup_id); - (void) GarbageCollect(); + // delete files that we might have already written + DeleteBackup(new_backup_id); + GarbageCollect(); return s; } @@ -1013,21 +1014,33 @@ Status BackupEngineImpl::BackupFile(BackupID backup_id, BackupMeta* backup, // if it's shared, we also need to check if it exists -- if it does, // no need to copy it again + bool need_to_copy = true; if (shared && backup_env_->FileExists(dst_path)) { + need_to_copy = false; if (shared_checksum) { Log(options_.info_log, "%s already present, with checksum %u and size %" PRIu64, src_fname.c_str(), checksum_value, size); + } else if (backuped_file_infos_.find(dst_relative) == + backuped_file_infos_.end()) { + // file already exists, but it's not referenced by any backup. overwrite + // the file + Log(options_.info_log, + "%s already present, but not referenced by any backup. We will " + "overwrite the file.", + src_fname.c_str()); + need_to_copy = true; + backup_env_->DeleteFile(dst_path); } else { - backup_env_->GetFileSize(dst_path, &size); // Ignore error + // the file is present and referenced by a backup + db_env_->GetFileSize(src_dir + src_fname, &size); // Ignore error Log(options_.info_log, "%s already present, calculate checksum", src_fname.c_str()); - s = CalculateChecksum(src_dir + src_fname, - db_env_, - size_limit, + s = CalculateChecksum(src_dir + src_fname, db_env_, size_limit, &checksum_value); } - } else { + } + if (need_to_copy) { Log(options_.info_log, "Copying %s to %s", src_fname.c_str(), dst_path_tmp.c_str()); s = CopyFile(src_dir + src_fname, @@ -1117,14 +1130,17 @@ Status BackupEngineImpl::GarbageCollect() { &shared_children); for (auto& child : shared_children) { std::string rel_fname = GetSharedFileRel(child); + auto child_itr = backuped_file_infos_.find(rel_fname); // if it's not refcounted, delete it - if (backuped_file_infos_.find(rel_fname) == backuped_file_infos_.end()) { + if (child_itr == backuped_file_infos_.end() || + child_itr->second->refs == 0) { // this might be a directory, but DeleteFile will just fail in that // case, so we're good Status s = backup_env_->DeleteFile(GetAbsolutePath(rel_fname)); if (s.ok()) { Log(options_.info_log, "Deleted %s", rel_fname.c_str()); } + backuped_file_infos_.erase(rel_fname); } } @@ -1178,7 +1194,9 @@ Status BackupEngineImpl::BackupMeta::AddFile( } } else { if (itr->second->checksum_value != file_info->checksum_value) { - return Status::Corruption("Checksum mismatch for existing backup file"); + return Status::Corruption( + "Checksum mismatch for existing backup file. Delete old backups and " + "try again."); } ++itr->second->refs; // increase refcount if already present } diff --git a/utilities/backupable/backupable_db_test.cc b/utilities/backupable/backupable_db_test.cc index 69ea741a856..1476d9df340 100644 --- a/utilities/backupable/backupable_db_test.cc +++ b/utilities/backupable/backupable_db_test.cc @@ -1023,6 +1023,30 @@ TEST_F(BackupableDBTest, ReadOnlyBackupEngine) { delete db; } +TEST_F(BackupableDBTest, GarbageCollectionBeforeBackup) { + DestroyDB(dbname_, Options()); + OpenBackupableDB(true); + + env_->CreateDirIfMissing(backupdir_ + "/shared"); + std::string file_five = backupdir_ + "/shared/000005.sst"; + std::string file_five_contents = "I'm not really a sst file"; + // this depends on the fact that 00005.sst is the first file created by the DB + ASSERT_OK(file_manager_->WriteToFile(file_five, file_five_contents)); + + FillDB(db_.get(), 0, 100); + // backup overwrites file 000005.sst + ASSERT_TRUE(db_->CreateNewBackup(true).ok()); + + std::string new_file_five_contents; + ASSERT_OK(ReadFileToString(env_, file_five, &new_file_five_contents)); + // file 000005.sst was overwritten + ASSERT_TRUE(new_file_five_contents != file_five_contents); + + CloseBackupableDB(); + + AssertBackupConsistency(0, 0, 100); +} + } // anon namespace } // namespace rocksdb