Skip to content

Commit

Permalink
Restore incremental backups of secondary index sstables. (#1093)
Browse files Browse the repository at this point in the history
* Remove last usage of CL BackupFileType.

* Remove unused remotePrefix() method.

* Create DateRange::contains to consolidate recurring logic in a consistent way.

* Change IMetaProxy API to return an ImmutableList of AbstractBackupPaths when fetching incrementals. The iterators are always fully materialized. Also, remove the now-redundant method from BackupRestoreUtil that merely wrapped the MetaProxy call.

* Include incremental secondary index files in restore.
  • Loading branch information
mattl-netflix committed Jun 1, 2024
1 parent 2bdd2d1 commit e93d85e
Show file tree
Hide file tree
Showing 11 changed files with 100 additions and 107 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,6 @@
import java.nio.file.Path;
import java.nio.file.Paths;
import java.time.Instant;
import java.util.Date;
import java.util.List;
import javax.inject.Inject;

Expand Down Expand Up @@ -149,14 +148,6 @@ public void parsePartialPrefix(String remoteFilePath) {
token = remotePath.getName(3).toString();
}

@Override
public String remotePrefix(Date start, Date end, String location) {
return PATH_JOINER.join(
clusterPrefix(location),
instanceIdentity.getInstance().getToken(),
match(start, end));
}

@Override
public Path remoteV2Prefix(Path location, BackupFileType fileType) {
if (location.getNameCount() <= 1) {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,6 @@ public abstract class AbstractBackupPath implements Comparable<AbstractBackupPat
ImmutableMap.of(BackupFolder.BACKUPS, 3, BackupFolder.SNAPSHOTS, 4);

public enum BackupFileType {
CL,
META_V2,
SECONDARY_INDEX_V2,
SNAPSHOT_VERIFIED,
Expand Down Expand Up @@ -149,9 +148,6 @@ public File newRestoreFile() {
File return_;
String dataDir = config.getDataFileLocation();
switch (type) {
case CL:
return_ = new File(PATH_JOINER.join(config.getBackupCommitLogLocation(), fileName));
break;
case SECONDARY_INDEX_V2:
String restoreFileName =
PATH_JOINER.join(dataDir, keyspace, columnFamily, indexDir, fileName);
Expand Down Expand Up @@ -188,11 +184,6 @@ public boolean equals(Object obj) {
/** Parses paths with just token prefixes */
public abstract void parsePartialPrefix(String remoteFilePath);

/**
* Provides a common prefix that matches all objects that fall between the start and end time
*/
public abstract String remotePrefix(Date start, Date end, String location);

public abstract Path remoteV2Prefix(Path location, BackupFileType fileType);

/** Provides the cluster prefix */
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,6 @@
import com.netflix.priam.backupv2.IMetaProxy;
import com.netflix.priam.utils.DateUtil;
import java.nio.file.Path;
import java.time.Instant;
import java.util.*;
import java.util.regex.Pattern;
import java.util.stream.Collectors;
Expand Down Expand Up @@ -83,19 +82,6 @@ public static List<AbstractBackupPath> getMostRecentSnapshotPaths(
return snapshotPaths;
}

public static List<AbstractBackupPath> getIncrementalPaths(
AbstractBackupPath latestValidMetaFile,
DateUtil.DateRange dateRange,
IMetaProxy metaProxy) {
Instant snapshotTime;
snapshotTime = latestValidMetaFile.getLastModified();
DateUtil.DateRange incrementalDateRange =
new DateUtil.DateRange(snapshotTime, dateRange.getEndTime());
List<AbstractBackupPath> incrementalPaths = new ArrayList<>();
metaProxy.getIncrementals(incrementalDateRange).forEachRemaining(incrementalPaths::add);
return incrementalPaths;
}

public static Map<String, List<String>> getFilter(String inputFilter)
throws IllegalArgumentException {
if (StringUtils.isEmpty(inputFilter)) return null;
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -209,18 +209,7 @@ public List<BackupMetadata> getLatestBackupMetadata(DateUtil.DateRange dateRange
.stream()
.filter(Objects::nonNull)
.filter(backupMetadata -> backupMetadata.getStatus() == Status.FINISHED)
.filter(
backupMetadata ->
backupMetadata
.getStart()
.toInstant()
.compareTo(dateRange.getStartTime())
>= 0
&& backupMetadata
.getStart()
.toInstant()
.compareTo(dateRange.getEndTime())
<= 0)
.filter(backupMetadata -> dateRange.contains(backupMetadata.getStart().toInstant()))
.sorted(Comparator.comparing(BackupMetadata::getStart).reversed())
.collect(Collectors.toList());
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -17,12 +17,12 @@

package com.netflix.priam.backupv2;

import com.google.common.collect.ImmutableList;
import com.netflix.priam.backup.AbstractBackupPath;
import com.netflix.priam.backup.BackupRestoreException;
import com.netflix.priam.backup.BackupVerificationResult;
import com.netflix.priam.utils.DateUtil;
import java.nio.file.Path;
import java.util.Iterator;
import java.util.List;

/** Proxy to do management tasks for meta files. Created by aagrawal on 12/18/18. */
Expand Down Expand Up @@ -78,7 +78,7 @@ public interface IMetaProxy {
* @param dateRange the time period to scan in the remote file system for incremental files.
* @return iterator containing the list of path on the remote file system satisfying criteria.
*/
Iterator<AbstractBackupPath> getIncrementals(DateUtil.DateRange dateRange);
ImmutableList<AbstractBackupPath> getIncrementals(DateUtil.DateRange dateRange);

/**
* Validate that all the files mentioned in the meta file actually exists on remote file system.
Expand Down
58 changes: 24 additions & 34 deletions priam/src/main/java/com/netflix/priam/backupv2/MetaV2Proxy.java
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@

package com.netflix.priam.backupv2;

import com.google.common.collect.ImmutableList;
import com.netflix.priam.backup.AbstractBackupPath;
import com.netflix.priam.backup.BackupRestoreException;
import com.netflix.priam.backup.BackupVerificationResult;
Expand All @@ -31,8 +32,6 @@
import java.util.*;
import javax.inject.Inject;
import javax.inject.Provider;
import org.apache.commons.collections4.iterators.FilterIterator;
import org.apache.commons.collections4.iterators.TransformIterator;
import org.apache.commons.io.FileUtils;
import org.apache.commons.io.filefilter.FileFilterUtils;
import org.apache.commons.io.filefilter.IOFileFilter;
Expand Down Expand Up @@ -84,40 +83,34 @@ private String getMatch(
}

@Override
public Iterator<AbstractBackupPath> getIncrementals(DateUtil.DateRange dateRange) {
String incrementalPrefix = getMatch(dateRange, AbstractBackupPath.BackupFileType.SST_V2);
String marker =
getMatch(
new DateUtil.DateRange(dateRange.getStartTime(), null),
AbstractBackupPath.BackupFileType.SST_V2);
public ImmutableList<AbstractBackupPath> getIncrementals(DateUtil.DateRange dateRange) {
return new ImmutableList.Builder<AbstractBackupPath>()
.addAll(getIncrementals(dateRange, AbstractBackupPath.BackupFileType.SST_V2))
.addAll(
getIncrementals(
dateRange, AbstractBackupPath.BackupFileType.SECONDARY_INDEX_V2))
.build();
}

private ImmutableList<AbstractBackupPath> getIncrementals(
DateUtil.DateRange dateRange, AbstractBackupPath.BackupFileType type) {
String incrementalPrefix = getMatch(dateRange, type);
String marker = getMatch(new DateUtil.DateRange(dateRange.getStartTime(), null), type);
logger.info(
"Listing filesystem with prefix: {}, marker: {}, daterange: {}",
incrementalPrefix,
marker,
dateRange);
Iterator<String> iterator = fs.listFileSystem(incrementalPrefix, null, marker);
Iterator<AbstractBackupPath> transformIterator =
new TransformIterator<>(
iterator,
s -> {
AbstractBackupPath path = abstractBackupPathProvider.get();
path.parseRemote(s);
return path;
});

return new FilterIterator<>(
transformIterator,
abstractBackupPath ->
(abstractBackupPath.getLastModified().isAfter(dateRange.getStartTime())
&& abstractBackupPath
.getLastModified()
.isBefore(dateRange.getEndTime()))
|| abstractBackupPath
.getLastModified()
.equals(dateRange.getStartTime())
|| abstractBackupPath
.getLastModified()
.equals(dateRange.getEndTime()));
ImmutableList.Builder<AbstractBackupPath> results = ImmutableList.builder();
while (iterator.hasNext()) {
AbstractBackupPath path = abstractBackupPathProvider.get();
path.parseRemote(iterator.next());
if (dateRange.contains(path.getLastModified())) {
results.add(path);
}
}
return results.build();
}

@Override
Expand All @@ -136,10 +129,7 @@ public List<AbstractBackupPath> findMetaFiles(DateUtil.DateRange dateRange) {
AbstractBackupPath abstractBackupPath = abstractBackupPathProvider.get();
abstractBackupPath.parseRemote(iterator.next());
logger.debug("Meta file found: {}", abstractBackupPath);
if (abstractBackupPath.getLastModified().toEpochMilli()
>= dateRange.getStartTime().toEpochMilli()
&& abstractBackupPath.getLastModified().toEpochMilli()
<= dateRange.getEndTime().toEpochMilli()) {
if (dateRange.contains(abstractBackupPath.getLastModified())) {
metas.add(abstractBackupPath);
}
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -160,25 +160,19 @@ public Response validateV2SnapshotByDate(
@Path("/list/{daterange}")
public Response list(@PathParam("daterange") String daterange) throws Exception {
DateUtil.DateRange dateRange = new DateUtil.DateRange(daterange);
// Find latest valid meta file.
Optional<AbstractBackupPath> latestValidMetaFile =
Optional<AbstractBackupPath> metaFile =
BackupRestoreUtil.getLatestValidMetaPath(metaProxy, dateRange);
if (!latestValidMetaFile.isPresent()) {
if (!metaFile.isPresent()) {
return Response.ok("No valid meta found!").build();
}
List<AbstractBackupPath> allFiles =
List<AbstractBackupPath> files =
BackupRestoreUtil.getMostRecentSnapshotPaths(
latestValidMetaFile.get(), metaProxy, pathProvider);
allFiles.addAll(
BackupRestoreUtil.getIncrementalPaths(
latestValidMetaFile.get(), dateRange, metaProxy));

return Response.ok(
GsonJsonSerializer.getGson()
.toJson(
allFiles.stream()
.map(AbstractBackupPath::getRemotePath)
.collect(Collectors.toList())))
.build();
metaFile.get(), metaProxy, pathProvider);
DateUtil.DateRange incrementalDateRange =
new DateRange(metaFile.get().getLastModified(), dateRange.getEndTime());
files.addAll(metaProxy.getIncrementals(incrementalDateRange));
List<String> remotePaths =
files.stream().map(AbstractBackupPath::getRemotePath).collect(Collectors.toList());
return Response.ok(GsonJsonSerializer.getGson().toJson(remotePaths)).build();
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -220,9 +220,11 @@ public void restore(DateUtil.DateRange dateRange) throws Exception {
BackupRestoreUtil.getMostRecentSnapshotPaths(
latestValidMetaFile.get(), metaProxy, pathProvider);
if (!config.skipIncrementalRestore()) {
allFiles.addAll(
BackupRestoreUtil.getIncrementalPaths(
latestValidMetaFile.get(), dateRange, metaProxy));
DateUtil.DateRange incrementalDateRange =
new DateUtil.DateRange(
latestValidMetaFile.get().getLastModified(),
dateRange.getEndTime());
allFiles.addAll(metaProxy.getIncrementals(incrementalDateRange));
}

// Download snapshot which is listed in the meta file.
Expand Down
4 changes: 4 additions & 0 deletions priam/src/main/java/com/netflix/priam/utils/DateUtil.java
Original file line number Diff line number Diff line change
Expand Up @@ -215,6 +215,10 @@ public Instant getEndTime() {
return endTime;
}

public boolean contains(Instant instant) {
return startTime.compareTo(instant) <= 0 && endTime.compareTo(instant) >= 0;
}

public String toString() {
return GsonJsonSerializer.getGson().toJson(this);
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,8 @@

package com.netflix.priam.backupv2;

import com.google.common.collect.ImmutableList;
import com.google.common.truth.Truth;
import com.google.inject.Guice;
import com.google.inject.Injector;
import com.netflix.priam.backup.AbstractBackupPath;
Expand All @@ -32,7 +34,6 @@
import java.time.Instant;
import java.time.temporal.ChronoUnit;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;
import java.util.stream.Collectors;
import javax.inject.Provider;
Expand Down Expand Up @@ -131,13 +132,16 @@ public void testGetSSTFilesFromMeta() throws Exception {
@Test
public void testGetIncrementalFiles() throws Exception {
DateUtil.DateRange dateRange = new DateUtil.DateRange("202812071820,20281229");
Iterator<AbstractBackupPath> incrementals = metaProxy.getIncrementals(dateRange);
int i = 0;
while (incrementals.hasNext()) {
System.out.println(incrementals.next());
i++;
}
Assert.assertEquals(3, i);
ImmutableList<AbstractBackupPath> paths = metaProxy.getIncrementals(dateRange);
Truth.assertThat(paths).hasSize(4);
}

@Test
public void testGetIncrementalFilesIncludesSecondaryIndexes() throws Exception {
DateUtil.DateRange dateRange = new DateUtil.DateRange("202812071820,20281229");
ImmutableList<AbstractBackupPath> paths = metaProxy.getIncrementals(dateRange);
Truth.assertThat(paths.get(3).getType())
.isEqualTo(AbstractBackupPath.BackupFileType.SECONDARY_INDEX_V2);
}

@Test
Expand Down Expand Up @@ -227,6 +231,17 @@ private List<String> getRemoteFakeFiles() {
"SNAPPY",
"PLAINTEXT",
"file4-Data.db"));
files.add(
Paths.get(
getPrefix(),
AbstractBackupPath.BackupFileType.SECONDARY_INDEX_V2.toString(),
"1859828420000",
"keyspace1",
"columnfamily1",
"index1",
"SNAPPY",
"PLAINTEXT",
"file5-Data.db"));
files.add(
Paths.get(
getPrefix(),
Expand Down
31 changes: 31 additions & 0 deletions priam/src/test/java/com/netflix/priam/utils/TestDateUtils.java
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@

package com.netflix.priam.utils;

import com.google.common.truth.Truth;
import java.time.Duration;
import java.time.Instant;
import java.time.temporal.ChronoUnit;
Expand Down Expand Up @@ -100,4 +101,34 @@ public void testFutureDateRangeValues() {
Assert.assertEquals(Instant.ofEpochSecond(1830686460), dateRange.getEndTime());
Assert.assertEquals("1830", dateRange.match());
}

@Test
public void testContainsInstantBeforeStartTime() {
DateUtil.DateRange dateRange = new DateUtil.DateRange("202404301200,202405011200");
Truth.assertThat(dateRange.contains(Instant.parse("2024-04-29T12:00:00Z"))).isFalse();
}

@Test
public void testContainsInstantEqualToStartTime() {
DateUtil.DateRange dateRange = new DateUtil.DateRange("202404301200,202405011200");
Truth.assertThat(dateRange.contains(Instant.parse("2024-04-30T12:00:00Z"))).isTrue();
}

@Test
public void testContainsInstantBetweenStartAndEndTimes() {
DateUtil.DateRange dateRange = new DateUtil.DateRange("202404301200,202405011200");
Truth.assertThat(dateRange.contains(Instant.parse("2024-05-01T00:00:00Z"))).isTrue();
}

@Test
public void testContainsInstantEqualToEndTime() {
DateUtil.DateRange dateRange = new DateUtil.DateRange("202404301200,202405011200");
Truth.assertThat(dateRange.contains(Instant.parse("2024-05-01T12:00:00Z"))).isTrue();
}

@Test
public void testContainsInstantAfterEndTime() {
DateUtil.DateRange dateRange = new DateUtil.DateRange("202404301200,202405011200");
Truth.assertThat(dateRange.contains(Instant.parse("2024-05-02T12:00:00Z"))).isFalse();
}
}

0 comments on commit e93d85e

Please sign in to comment.