package it.cavallium.dbengine.database.disk; import static it.cavallium.dbengine.database.LLUtils.MARKER_ROCKSDB; import io.micrometer.core.instrument.MeterRegistry; import io.netty5.buffer.api.Buffer; import io.netty5.buffer.api.BufferAllocator; import io.netty5.buffer.api.MemoryManager; import io.netty5.util.Send; import it.cavallium.dbengine.database.LLDelta; import it.cavallium.dbengine.database.LLUtils; import java.io.IOException; import java.util.concurrent.locks.Lock; import java.util.concurrent.locks.StampedLock; import org.jetbrains.annotations.NotNull; import org.jetbrains.annotations.Nullable; import org.rocksdb.ColumnFamilyHandle; import org.rocksdb.ReadOptions; import org.rocksdb.RocksDBException; import org.rocksdb.Transaction; import org.rocksdb.TransactionDB; import org.rocksdb.TransactionOptions; import org.rocksdb.WriteOptions; import reactor.core.scheduler.Schedulers; public final class PessimisticRocksDBColumn extends AbstractRocksDBColumn { private static final TransactionOptions DEFAULT_TX_OPTIONS = new TransactionOptions(); public PessimisticRocksDBColumn(TransactionDB db, boolean nettyDirect, BufferAllocator alloc, String dbName, ColumnFamilyHandle cfh, MeterRegistry meterRegistry, StampedLock closeLock) { super(db, nettyDirect, alloc, dbName, cfh, meterRegistry, closeLock); } @Override protected boolean commitOptimistically(Transaction tx) throws RocksDBException { tx.commit(); return true; } @Override protected Transaction beginTransaction(@NotNull WriteOptions writeOptions, TransactionOptions txOpts) { return getDb().beginTransaction(writeOptions, txOpts); } @Override public @NotNull UpdateAtomicResult updateAtomicImpl(@NotNull ReadOptions readOptions, @NotNull WriteOptions writeOptions, Buffer key, BinarySerializationFunction updater, UpdateAtomicResultMode returnMode) throws IOException { long initNanoTime = System.nanoTime(); try { var cfh = getCfh(); var keyArray = LLUtils.toArray(key); if (Schedulers.isInNonBlockingThread()) { throw new UnsupportedOperationException("Called update in a nonblocking thread"); } try (var txOpts = new TransactionOptions(); var tx = beginTransaction(writeOptions, txOpts)) { Buffer prevData = null; Buffer newData = null; try { boolean changed; if (logger.isTraceEnabled()) { logger.trace(MARKER_ROCKSDB, "Reading {} (before update lock)", LLUtils.toStringSafe(key)); } var prevDataArray = tx.getForUpdate(readOptions, cfh, keyArray, true); try { if (logger.isTraceEnabled()) { logger.trace(MARKER_ROCKSDB, "Reading {}: {} (before update)", LLUtils.toStringSafe(key), LLUtils.toStringSafe(prevDataArray) ); } if (prevDataArray != null) { readValueFoundWithoutBloomBufferSize.record(prevDataArray.length); prevData = MemoryManager.unsafeWrap(prevDataArray); } else { readValueNotFoundWithoutBloomBufferSize.record(0); } Buffer prevDataToSendToUpdater; if (prevData != null) { prevDataToSendToUpdater = prevData.copy().makeReadOnly(); } else { prevDataToSendToUpdater = null; } try { newData = updater.apply(prevDataToSendToUpdater); } finally { if (prevDataToSendToUpdater != null && prevDataToSendToUpdater.isAccessible()) { prevDataToSendToUpdater.close(); } } var newDataArray = newData == null ? null : LLUtils.toArray(newData); if (logger.isTraceEnabled()) { logger.trace(MARKER_ROCKSDB, "Updating {}. previous data: {}, updated data: {}", LLUtils.toStringSafe(key), LLUtils.toStringSafe(prevDataArray), LLUtils.toStringSafe(newDataArray) ); } if (prevData != null && newData == null) { if (logger.isTraceEnabled()) { logger.trace(MARKER_ROCKSDB, "Deleting {} (after update)", LLUtils.toStringSafe(key)); } writeValueBufferSize.record(0); tx.delete(cfh, keyArray, true); changed = true; tx.commit(); } else if (newData != null && (prevData == null || !LLUtils.equals(prevData, newData))) { if (logger.isTraceEnabled()) { logger.trace(MARKER_ROCKSDB, "Writing {}: {} (after update)", LLUtils.toStringSafe(key), LLUtils.toStringSafe(newData) ); } writeValueBufferSize.record(newDataArray.length); tx.put(cfh, keyArray, newDataArray); changed = true; tx.commit(); } else { changed = false; tx.rollback(); } } finally { tx.undoGetForUpdate(cfh, keyArray); } recordAtomicUpdateTime(changed, prevData != null, newData != null, initNanoTime); return switch (returnMode) { case NOTHING -> { if (prevData != null) { prevData.close(); } if (newData != null) { newData.close(); } yield RESULT_NOTHING; } case CURRENT -> { if (prevData != null) { prevData.close(); } yield new UpdateAtomicResultCurrent(newData); } case PREVIOUS -> { if (newData != null) { newData.close(); } yield new UpdateAtomicResultPrevious(prevData); } case BINARY_CHANGED -> { if (prevData != null) { prevData.close(); } if (newData != null) { newData.close(); } yield new UpdateAtomicResultBinaryChanged(changed); } case DELTA -> new UpdateAtomicResultDelta(LLDelta.of(prevData, newData)); }; } catch (Throwable ex) { if (prevData != null && prevData.isAccessible()) { prevData.close(); } if (newData != null && newData.isAccessible()) { newData.close(); } throw ex; } } } catch (Throwable ex) { throw new IOException("Failed to update key " + LLUtils.toStringSafe(key), ex); } } @Override public boolean supportsTransactions() { return true; } }