-
Notifications
You must be signed in to change notification settings - Fork 319
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
tsaitsung-han.tht
committed
Sep 20, 2022
1 parent
b02cd0c
commit bf7bd6c
Showing
31 changed files
with
1,508 additions
and
69 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
257 changes: 257 additions & 0 deletions
257
dledger/src/main/java/io/openmessaging/storage/dledger/snapshot/SnapshotManager.java
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,257 @@ | ||
/* | ||
* Copyright 2017-2022 The DLedger Authors. | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* https://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
|
||
package io.openmessaging.storage.dledger.snapshot; | ||
|
||
import io.openmessaging.storage.dledger.DLedgerConfig; | ||
import io.openmessaging.storage.dledger.DLedgerServer; | ||
import io.openmessaging.storage.dledger.entry.DLedgerEntry; | ||
import io.openmessaging.storage.dledger.exception.DLedgerException; | ||
import io.openmessaging.storage.dledger.protocol.DLedgerResponseCode; | ||
import io.openmessaging.storage.dledger.snapshot.file.FileSnapshotStore; | ||
import io.openmessaging.storage.dledger.snapshot.hook.LoadSnapshotHook; | ||
import io.openmessaging.storage.dledger.snapshot.hook.SaveSnapshotHook; | ||
import io.openmessaging.storage.dledger.utils.IOUtils; | ||
import org.slf4j.Logger; | ||
import org.slf4j.LoggerFactory; | ||
|
||
import java.io.File; | ||
import java.io.IOException; | ||
import java.util.Objects; | ||
import java.util.concurrent.CompletableFuture; | ||
|
||
public class SnapshotManager { | ||
|
||
private static Logger logger = LoggerFactory.getLogger(SnapshotManager.class); | ||
|
||
public static final String SNAPSHOT_META_FILE = "snapshot_meta"; | ||
public static final String SNAPSHOT_DATA_FILE = "data"; | ||
public static final String SNAPSHOT_DIR_PREFIX = "snapshot_"; | ||
public static final String SNAPSHOT_TEMP_DIR = "tmp"; | ||
|
||
private DLedgerServer dLedgerServer; | ||
private long lastSnapshotIndex; | ||
private long lastSnapshotTerm; | ||
private final SnapshotStore snapshotStore; | ||
private volatile boolean savingSnapshot; | ||
private volatile boolean loadingSnapshot; | ||
|
||
public SnapshotManager(DLedgerServer dLedgerServer) { | ||
this.dLedgerServer = dLedgerServer; | ||
this.snapshotStore = new FileSnapshotStore(this.dLedgerServer.getDLedgerConfig().getSnapshotStoreBaseDir()); | ||
} | ||
|
||
public boolean isSavingSnapshot() { | ||
return savingSnapshot; | ||
} | ||
|
||
public boolean isLoadingSnapshot() { | ||
return loadingSnapshot; | ||
} | ||
|
||
private class SaveSnapshotAfterHook implements SaveSnapshotHook { | ||
|
||
SnapshotWriter writer; | ||
DLedgerEntry dLedgerEntry; | ||
SnapshotMeta snapshotMeta; | ||
|
||
public SaveSnapshotAfterHook(SnapshotWriter writer, DLedgerEntry dLedgerEntry) { | ||
this.writer = writer; | ||
this.dLedgerEntry = dLedgerEntry; | ||
} | ||
|
||
@Override | ||
public void doHook(SnapshotStatus status) { | ||
CompletableFuture.runAsync(() -> { | ||
saveSnapshotAfter(writer, snapshotMeta, dLedgerEntry, status); | ||
}); | ||
} | ||
|
||
@Override | ||
public void registerSnapshotMeta(SnapshotMeta snapshotMeta) { | ||
this.snapshotMeta = snapshotMeta; | ||
this.writer.setSnapshotMeta(snapshotMeta); | ||
} | ||
|
||
@Override | ||
public SnapshotWriter getSnapshotWriter() { | ||
return this.writer; | ||
} | ||
|
||
@Override | ||
public DLedgerEntry getSnapshotEntry() { | ||
return this.dLedgerEntry; | ||
} | ||
} | ||
|
||
private class LoadSnapshotAfterHook implements LoadSnapshotHook { | ||
|
||
SnapshotReader reader; | ||
SnapshotMeta snapshotMeta; | ||
|
||
public LoadSnapshotAfterHook(SnapshotReader reader) { | ||
this.reader = reader; | ||
} | ||
|
||
@Override | ||
public void doHook(SnapshotStatus status) { | ||
loadSnapshotAfter(reader, snapshotMeta, status); | ||
} | ||
|
||
@Override | ||
public void registerSnapshotMeta(SnapshotMeta snapshotMeta) { | ||
this.snapshotMeta = snapshotMeta; | ||
} | ||
|
||
@Override | ||
public SnapshotReader getSnapshotReader() { | ||
return this.reader; | ||
} | ||
} | ||
|
||
public void saveSnapshot(DLedgerEntry dLedgerEntry) { | ||
// Check if still saving other snapshots | ||
if (this.savingSnapshot) { | ||
return; | ||
} | ||
// Check if applied index reaching the snapshot threshold | ||
if (dLedgerEntry.getIndex() - this.lastSnapshotIndex <= this.dLedgerServer.getDLedgerConfig().getSnapshotThreshold()) { | ||
return; | ||
} | ||
// Create snapshot writer | ||
SnapshotWriter writer = this.snapshotStore.createSnapshotWriter(); | ||
if (writer == null) { | ||
return; | ||
} | ||
// Start saving snapshot | ||
this.savingSnapshot = true; | ||
SaveSnapshotAfterHook saveSnapshotAfter = new SaveSnapshotAfterHook(writer, dLedgerEntry); | ||
if (!this.dLedgerServer.getFsmCaller().onSnapshotSave(saveSnapshotAfter)) { | ||
logger.error("Unable to call statemachine onSnapshotSave"); | ||
saveSnapshotAfter.doHook(SnapshotStatus.FAIL); | ||
} | ||
} | ||
|
||
private void saveSnapshotAfter(SnapshotWriter writer, SnapshotMeta snapshotMeta, DLedgerEntry dLedgerEntry, SnapshotStatus status) { | ||
int res = status.getCode(); | ||
// Update snapshot meta | ||
if (res == SnapshotStatus.SUCCESS.getCode()) { | ||
writer.setSnapshotMeta(snapshotMeta); | ||
} | ||
// Write snapshot meta into files and close snapshot writer | ||
try { | ||
writer.save(status); | ||
} catch (IOException e) { | ||
logger.error("Unable to close snapshot writer", e); | ||
res = SnapshotStatus.FAIL.getCode(); | ||
} | ||
if (res == SnapshotStatus.SUCCESS.getCode()) { | ||
this.lastSnapshotIndex = snapshotMeta.getLastIncludedIndex(); | ||
this.lastSnapshotTerm = snapshotMeta.getLastIncludedTerm(); | ||
logger.info("Snapshot {} saved successfully", snapshotMeta); | ||
// Remove previous logs | ||
truncatePrefix(dLedgerEntry); | ||
} else { | ||
logger.error("Unable to save snapshot"); | ||
} | ||
this.savingSnapshot = false; | ||
} | ||
|
||
private void truncatePrefix(DLedgerEntry entry) { | ||
this.dLedgerServer.getFsmCaller().getdLedgerStore().resetOffsetAfterSnapshot(entry); | ||
deleteExpiredSnapshot(); | ||
} | ||
|
||
private void deleteExpiredSnapshot() { | ||
// Remove the oldest snapshot | ||
DLedgerConfig config = dLedgerServer.getDLedgerConfig(); | ||
File[] snapshotFiles = new File(config.getSnapshotStoreBaseDir()).listFiles(); | ||
if (snapshotFiles != null && snapshotFiles.length > config.getMaxSnapshotReservedNum()) { | ||
long minSnapshotIdx = Long.MAX_VALUE; | ||
for (File file : snapshotFiles) { | ||
String fileName = file.getName(); | ||
if (!fileName.startsWith(SnapshotManager.SNAPSHOT_DIR_PREFIX)) { | ||
continue; | ||
} | ||
minSnapshotIdx = Math.min(Long.parseLong(fileName.substring(SnapshotManager.SNAPSHOT_DIR_PREFIX.length())), minSnapshotIdx); | ||
} | ||
String deleteFilePath = config.getSnapshotStoreBaseDir() + File.separator + SnapshotManager.SNAPSHOT_DIR_PREFIX + minSnapshotIdx; | ||
try { | ||
IOUtils.deleteFile(new File(deleteFilePath)); | ||
} catch (IOException e) { | ||
logger.error("Unable to remove expired snapshot: {}", deleteFilePath, e); | ||
} | ||
} | ||
} | ||
|
||
public void loadSnapshot() { | ||
// Check if still loading snapshot | ||
if (loadingSnapshot) { | ||
return; | ||
} | ||
// Create snapshot reader | ||
SnapshotReader reader = snapshotStore.createSnapshotReader(); | ||
if (reader == null) { | ||
return; | ||
} | ||
// Start loading snapshot | ||
this.loadingSnapshot = true; | ||
LoadSnapshotAfterHook loadSnapshotAfter = new LoadSnapshotAfterHook(reader); | ||
if (!this.dLedgerServer.getFsmCaller().onSnapshotLoad(loadSnapshotAfter)) { | ||
this.dLedgerServer.getFsmCaller().setError(this.dLedgerServer, | ||
new DLedgerException(DLedgerResponseCode.LOAD_SNAPSHOT_ERROR, "Unable to call statemachine onSnapshotLoad")); | ||
} | ||
} | ||
|
||
private void loadSnapshotAfter(SnapshotReader reader, SnapshotMeta snapshotMeta, SnapshotStatus status) { | ||
if (status.getCode() == SnapshotStatus.SUCCESS.getCode()) { | ||
this.lastSnapshotIndex = snapshotMeta.getLastIncludedIndex(); | ||
this.lastSnapshotTerm = snapshotMeta.getLastIncludedTerm(); | ||
this.loadingSnapshot = false; | ||
logger.info("Snapshot {} loaded successfully", snapshotMeta); | ||
} else { | ||
// Stop the loading process if the snapshot is expired or the beginning index of file store is 0 | ||
if (status.getCode() == SnapshotStatus.EXPIRED.getCode() || | ||
this.dLedgerServer.getFsmCaller().getdLedgerStore().getLedgerBeginIndex() == 0) { | ||
this.loadingSnapshot = false; | ||
return; | ||
} | ||
// Remove the error snapshot | ||
boolean failed = false; | ||
try { | ||
IOUtils.deleteFile(new File(reader.getSnapshotStorePath())); | ||
} catch (IOException e) { | ||
logger.error("Unable to remove error snapshot: {}", reader.getSnapshotStorePath(), e); | ||
failed = true; | ||
} | ||
// Check if there is snapshot exists | ||
DLedgerConfig config = this.dLedgerServer.getDLedgerConfig(); | ||
if (Objects.requireNonNull(new File(config.getSnapshotStoreBaseDir()).listFiles()).length == 0) { | ||
logger.error("No snapshot for recovering state machine: {}", config.getSnapshotStoreBaseDir()); | ||
failed = true; | ||
} | ||
if (failed) { | ||
this.dLedgerServer.getFsmCaller().setError(this.dLedgerServer, | ||
new DLedgerException(DLedgerResponseCode.LOAD_SNAPSHOT_ERROR, "Fail to recover state machine")); | ||
return; | ||
} | ||
// Retry loading the previous snapshots | ||
logger.warn("Load snapshot from {} failed. Start recovering from the previous snapshot", reader.getSnapshotStorePath()); | ||
this.loadingSnapshot = false; | ||
loadSnapshot(); | ||
} | ||
} | ||
} |
Oops, something went wrong.