193 lines
5.9 KiB
Java
193 lines
5.9 KiB
Java
package it.cavallium.dbengine.database.disk;
|
|
|
|
import static it.cavallium.dbengine.database.LLUtils.MARKER_ROCKSDB;
|
|
|
|
import io.micrometer.core.instrument.MeterRegistry;
|
|
import io.netty5.buffer.api.Buffer;
|
|
import io.netty5.buffer.api.BufferAllocator;
|
|
import io.netty5.buffer.api.MemoryManager;
|
|
import io.netty5.buffer.api.Send;
|
|
import it.cavallium.dbengine.database.LLDelta;
|
|
import it.cavallium.dbengine.database.LLUtils;
|
|
import java.io.IOException;
|
|
import java.util.concurrent.locks.Lock;
|
|
import java.util.concurrent.locks.StampedLock;
|
|
import org.jetbrains.annotations.NotNull;
|
|
import org.jetbrains.annotations.Nullable;
|
|
import org.rocksdb.ColumnFamilyHandle;
|
|
import org.rocksdb.ReadOptions;
|
|
import org.rocksdb.RocksDBException;
|
|
import org.rocksdb.Transaction;
|
|
import org.rocksdb.TransactionDB;
|
|
import org.rocksdb.TransactionOptions;
|
|
import org.rocksdb.WriteOptions;
|
|
import reactor.core.scheduler.Schedulers;
|
|
|
|
public final class PessimisticRocksDBColumn extends AbstractRocksDBColumn<TransactionDB> {
|
|
|
|
private static final TransactionOptions DEFAULT_TX_OPTIONS = new TransactionOptions();
|
|
|
|
public PessimisticRocksDBColumn(TransactionDB db,
|
|
boolean nettyDirect,
|
|
BufferAllocator alloc,
|
|
String dbName,
|
|
ColumnFamilyHandle cfh,
|
|
MeterRegistry meterRegistry,
|
|
StampedLock closeLock) {
|
|
super(db, nettyDirect, alloc, dbName, cfh, meterRegistry, closeLock);
|
|
}
|
|
|
|
@Override
|
|
protected boolean commitOptimistically(Transaction tx) throws RocksDBException {
|
|
tx.commit();
|
|
return true;
|
|
}
|
|
|
|
@Override
|
|
protected Transaction beginTransaction(@NotNull WriteOptions writeOptions,
|
|
TransactionOptions txOpts) {
|
|
return getDb().beginTransaction(writeOptions, txOpts);
|
|
}
|
|
|
|
@Override
|
|
public @NotNull UpdateAtomicResult updateAtomicImpl(@NotNull ReadOptions readOptions,
|
|
@NotNull WriteOptions writeOptions,
|
|
Buffer key,
|
|
BinarySerializationFunction updater,
|
|
UpdateAtomicResultMode returnMode) throws IOException {
|
|
long initNanoTime = System.nanoTime();
|
|
try {
|
|
var cfh = getCfh();
|
|
var keyArray = LLUtils.toArray(key);
|
|
if (Schedulers.isInNonBlockingThread()) {
|
|
throw new UnsupportedOperationException("Called update in a nonblocking thread");
|
|
}
|
|
try (var txOpts = new TransactionOptions();
|
|
var tx = beginTransaction(writeOptions, txOpts)) {
|
|
Buffer prevData = null;
|
|
Buffer newData = null;
|
|
try {
|
|
boolean changed;
|
|
if (logger.isTraceEnabled()) {
|
|
logger.trace(MARKER_ROCKSDB, "Reading {} (before update lock)", LLUtils.toStringSafe(key));
|
|
}
|
|
var prevDataArray = tx.getForUpdate(readOptions, cfh, keyArray, true);
|
|
try {
|
|
if (logger.isTraceEnabled()) {
|
|
logger.trace(MARKER_ROCKSDB,
|
|
"Reading {}: {} (before update)",
|
|
LLUtils.toStringSafe(key),
|
|
LLUtils.toStringSafe(prevDataArray)
|
|
);
|
|
}
|
|
if (prevDataArray != null) {
|
|
readValueFoundWithoutBloomBufferSize.record(prevDataArray.length);
|
|
prevData = MemoryManager.unsafeWrap(prevDataArray);
|
|
} else {
|
|
readValueNotFoundWithoutBloomBufferSize.record(0);
|
|
}
|
|
Buffer prevDataToSendToUpdater;
|
|
if (prevData != null) {
|
|
prevDataToSendToUpdater = prevData.copy().makeReadOnly();
|
|
} else {
|
|
prevDataToSendToUpdater = null;
|
|
}
|
|
|
|
try {
|
|
newData = updater.apply(prevDataToSendToUpdater);
|
|
} finally {
|
|
if (prevDataToSendToUpdater != null && prevDataToSendToUpdater.isAccessible()) {
|
|
prevDataToSendToUpdater.close();
|
|
}
|
|
}
|
|
var newDataArray = newData == null ? null : LLUtils.toArray(newData);
|
|
if (logger.isTraceEnabled()) {
|
|
logger.trace(MARKER_ROCKSDB,
|
|
"Updating {}. previous data: {}, updated data: {}",
|
|
LLUtils.toStringSafe(key),
|
|
LLUtils.toStringSafe(prevDataArray),
|
|
LLUtils.toStringSafe(newDataArray)
|
|
);
|
|
}
|
|
if (prevData != null && newData == null) {
|
|
if (logger.isTraceEnabled()) {
|
|
logger.trace(MARKER_ROCKSDB, "Deleting {} (after update)", LLUtils.toStringSafe(key));
|
|
}
|
|
writeValueBufferSize.record(0);
|
|
tx.delete(cfh, keyArray, true);
|
|
changed = true;
|
|
tx.commit();
|
|
} else if (newData != null && (prevData == null || !LLUtils.equals(prevData, newData))) {
|
|
if (logger.isTraceEnabled()) {
|
|
logger.trace(MARKER_ROCKSDB,
|
|
"Writing {}: {} (after update)",
|
|
LLUtils.toStringSafe(key),
|
|
LLUtils.toStringSafe(newData)
|
|
);
|
|
}
|
|
writeValueBufferSize.record(newDataArray.length);
|
|
tx.put(cfh, keyArray, newDataArray);
|
|
changed = true;
|
|
tx.commit();
|
|
} else {
|
|
changed = false;
|
|
tx.rollback();
|
|
}
|
|
} finally {
|
|
tx.undoGetForUpdate(cfh, keyArray);
|
|
}
|
|
recordAtomicUpdateTime(changed, prevData != null, newData != null, initNanoTime);
|
|
return switch (returnMode) {
|
|
case NOTHING -> {
|
|
if (prevData != null) {
|
|
prevData.close();
|
|
}
|
|
if (newData != null) {
|
|
newData.close();
|
|
}
|
|
yield RESULT_NOTHING;
|
|
}
|
|
case CURRENT -> {
|
|
if (prevData != null) {
|
|
prevData.close();
|
|
}
|
|
yield new UpdateAtomicResultCurrent(newData);
|
|
}
|
|
case PREVIOUS -> {
|
|
if (newData != null) {
|
|
newData.close();
|
|
}
|
|
yield new UpdateAtomicResultPrevious(prevData);
|
|
}
|
|
case BINARY_CHANGED -> {
|
|
if (prevData != null) {
|
|
prevData.close();
|
|
}
|
|
if (newData != null) {
|
|
newData.close();
|
|
}
|
|
yield new UpdateAtomicResultBinaryChanged(changed);
|
|
}
|
|
case DELTA -> new UpdateAtomicResultDelta(LLDelta.of(prevData, newData));
|
|
};
|
|
} catch (Throwable ex) {
|
|
if (prevData != null && prevData.isAccessible()) {
|
|
prevData.close();
|
|
}
|
|
if (newData != null && newData.isAccessible()) {
|
|
newData.close();
|
|
}
|
|
throw ex;
|
|
}
|
|
}
|
|
} catch (Throwable ex) {
|
|
throw new IOException("Failed to update key " + LLUtils.toStringSafe(key), ex);
|
|
}
|
|
}
|
|
|
|
@Override
|
|
public boolean supportsTransactions() {
|
|
return true;
|
|
}
|
|
}
|