-
Notifications
You must be signed in to change notification settings - Fork 293
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
endpoint to return backup queue, metatdata and pending files count #1100
base: 4.x
Are you sure you want to change the base?
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,66 @@ | ||
package com.netflix.priam.backup; | ||
|
||
import java.io.IOException; | ||
import java.nio.file.*; | ||
import java.nio.file.attribute.BasicFileAttributes; | ||
|
||
/** Estimates remaining bytes or files to upload in a backup by looking at the file system */ | ||
public class IncrementalBackupDirectorySize implements DirectorySize { | ||
|
||
public long getBytes(String location) { | ||
SummingFileVisitor fileVisitor = new SummingFileVisitor(); | ||
try { | ||
Files.walkFileTree(Paths.get(location), fileVisitor); | ||
} catch (IOException e) { | ||
// BackupFileVisitor is happy with an estimate and won't produce these in practice. | ||
} | ||
return fileVisitor.getTotalBytes(); | ||
} | ||
|
||
public int getFiles(String location) { | ||
SummingFileVisitor fileVisitor = new SummingFileVisitor(); | ||
try { | ||
Files.walkFileTree(Paths.get(location), fileVisitor); | ||
} catch (IOException e) { | ||
// BackupFileVisitor is happy with an estimate and won't produce these in practice. | ||
} | ||
return fileVisitor.getTotalFiles(); | ||
} | ||
|
||
private static final class SummingFileVisitor implements FileVisitor<Path> { | ||
private long totalBytes; | ||
private int totalFiles; | ||
|
||
@Override | ||
public FileVisitResult preVisitDirectory(Path dir, BasicFileAttributes attrs) { | ||
return FileVisitResult.CONTINUE; | ||
} | ||
|
||
@Override | ||
public FileVisitResult visitFile(Path file, BasicFileAttributes attrs) { | ||
if (file.toString().contains(AbstractBackup.INCREMENTAL_BACKUP_FOLDER) && attrs.isRegularFile()) { | ||
totalBytes += attrs.size(); | ||
totalFiles += 1; | ||
} | ||
return FileVisitResult.CONTINUE; | ||
} | ||
|
||
@Override | ||
public FileVisitResult visitFileFailed(Path file, IOException exc) { | ||
return FileVisitResult.CONTINUE; | ||
} | ||
|
||
@Override | ||
public FileVisitResult postVisitDirectory(Path dir, IOException exc) { | ||
return FileVisitResult.CONTINUE; | ||
} | ||
|
||
long getTotalBytes() { | ||
return totalBytes; | ||
} | ||
|
||
int getTotalFiles() { | ||
return totalFiles; | ||
} | ||
} | ||
} |
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -17,6 +17,8 @@ | |
|
||
package com.netflix.priam.resources; | ||
|
||
import com.fasterxml.jackson.databind.ObjectMapper; | ||
import com.netflix.priam.PriamServer; | ||
import com.netflix.priam.backup.*; | ||
import com.netflix.priam.backupv2.BackupTTLTask; | ||
import com.netflix.priam.backupv2.BackupV2Service; | ||
|
@@ -29,7 +31,9 @@ | |
import com.netflix.priam.utils.GsonJsonSerializer; | ||
import java.time.Instant; | ||
import java.time.temporal.ChronoUnit; | ||
import java.util.HashMap; | ||
import java.util.List; | ||
import java.util.Map; | ||
import java.util.Optional; | ||
import java.util.stream.Collectors; | ||
import javax.inject.Inject; | ||
|
@@ -55,6 +59,8 @@ public class BackupServletV2 { | |
private final Provider<AbstractBackupPath> pathProvider; | ||
private final BackupV2Service backupService; | ||
private final BackupNotificationMgr backupNotificationMgr; | ||
private final PriamServer priamServer; | ||
|
||
private static final String REST_SUCCESS = "[\"ok\"]"; | ||
|
||
@Inject | ||
|
@@ -68,7 +74,8 @@ public BackupServletV2( | |
@Named("v2") IMetaProxy metaV2Proxy, | ||
Provider<AbstractBackupPath> pathProvider, | ||
BackupV2Service backupService, | ||
BackupNotificationMgr backupNotificationMgr) { | ||
BackupNotificationMgr backupNotificationMgr, | ||
PriamServer priamServer) { | ||
this.backupStatusMgr = backupStatusMgr; | ||
this.backupVerification = backupVerification; | ||
this.snapshotMetaService = snapshotMetaService; | ||
|
@@ -78,6 +85,7 @@ public BackupServletV2( | |
this.pathProvider = pathProvider; | ||
this.backupService = backupService; | ||
this.backupNotificationMgr = backupNotificationMgr; | ||
this.priamServer = priamServer; | ||
} | ||
|
||
@GET | ||
|
@@ -181,4 +189,26 @@ public Response list(@PathParam("daterange") String daterange) throws Exception | |
.collect(Collectors.toList()))) | ||
.build(); | ||
} | ||
|
||
@GET | ||
@Path("/state/{hours}") | ||
public Response backupState(@PathParam("hours") int hours) throws Exception { | ||
Map<String, Object> responseMap = new HashMap<>(); | ||
|
||
responseMap.put("tasksQueued", fs.getUploadTasksQueued()); | ||
responseMap.put("queueSize", priamServer.getConfiguration().getBackupQueueSize()); | ||
for (Map.Entry<String, Integer> entry : | ||
backupService.countPendingBackupFiles().entrySet()) { | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Why do we need to make a distinction between snapshot and incremental backup files in this case? Prefer to combine them into a total count if we can afford to. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Addressed this in new commit |
||
responseMap.put(entry.getKey(), entry.getValue()); | ||
} | ||
|
||
List<BackupMetadata> latestBackupMetadata = | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. We can get this metadata from elsewhere. Please don't make the local node do it. Prefer creating an Antigravity endpoint that fetches this information from cass_cde. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. We want a node specific backup metadata in the realtime to compute if the backup was started in last 30 mins. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. i would also be concerned that we are depending on an additional system as I commented above. Is there a harm in checking this here? |
||
backupStatusMgr.getLatestBackupMetadata( | ||
new DateRange(Instant.now().minus(hours, ChronoUnit.HOURS), Instant.now())); | ||
responseMap.put("latestBackupMetadata", latestBackupMetadata); | ||
|
||
ObjectMapper mapper = new ObjectMapper(); | ||
String jsonResponse = mapper.writeValueAsString(responseMap); | ||
return Response.ok(jsonResponse).build(); | ||
} | ||
} |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
This does not require information that only the local node has. Please read it from fast properties. Or better yet, don't include it in the calculations as we might move to a model where the queue is small and populated as needed and the only metric that matters is the remaining files on disk.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
This FP is not set for every cluster and we need it to compute the file threshold for which we want to wait for backup upload to complete.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Since we are already making a call to Priam what is the harm in checking this here? The downside I see to checking FPs is we now rely on yet another system and per Ayushis comment would have the default hardcoded in multiple places.