Move uid lock into LiveVersionMap (#27905)
While the LiveVersionMap is an internal class that belongs to the engine we do rely on some external locking to enforce the desired semantics. Yet, in tests we mimic the outer locking but we don't have any way to enforce or assert on that the lock is actually hold. This change moves the KeyedLock inside the LiveVersionMap that allows the engine to access it as before but enables assertions in the LiveVersionMap to ensure the lock for the modifying or reading key is actually hold.
This commit is contained in:
parent
8b2eee39f0
commit
0779af6dd2
|
@ -117,8 +117,6 @@ public class InternalEngine extends Engine {
|
|||
// we use the hashed variant since we iterate over it and check removal and additions on existing keys
|
||||
private final LiveVersionMap versionMap = new LiveVersionMap();
|
||||
|
||||
private final KeyedLock<BytesRef> keyedLock = new KeyedLock<>();
|
||||
|
||||
private volatile SegmentInfos lastCommittedSegmentInfos;
|
||||
|
||||
private final IndexThrottle throttle;
|
||||
|
@ -551,7 +549,11 @@ public class InternalEngine extends Engine {
|
|||
ensureOpen();
|
||||
SearcherScope scope;
|
||||
if (get.realtime()) {
|
||||
VersionValue versionValue = getVersionFromMap(get.uid().bytes());
|
||||
VersionValue versionValue = null;
|
||||
try (Releasable ignore = versionMap.acquireLock(get.uid().bytes())) {
|
||||
// we need to lock here to access the version map to do this truly in RT
|
||||
versionValue = getVersionFromMap(get.uid().bytes());
|
||||
}
|
||||
if (versionValue != null) {
|
||||
if (versionValue.isDelete()) {
|
||||
return GetResult.NOT_EXISTS;
|
||||
|
@ -733,7 +735,7 @@ public class InternalEngine extends Engine {
|
|||
ensureOpen();
|
||||
assert assertIncomingSequenceNumber(index.origin(), index.seqNo());
|
||||
assert assertVersionType(index);
|
||||
try (Releasable ignored = acquireLock(index.uid());
|
||||
try (Releasable ignored = versionMap.acquireLock(index.uid().bytes());
|
||||
Releasable indexThrottle = doThrottle ? () -> {} : throttle.acquireThrottle()) {
|
||||
lastWriteNanos = index.startTime();
|
||||
/* A NOTE ABOUT APPEND ONLY OPTIMIZATIONS:
|
||||
|
@ -1059,7 +1061,7 @@ public class InternalEngine extends Engine {
|
|||
assert assertIncomingSequenceNumber(delete.origin(), delete.seqNo());
|
||||
final DeleteResult deleteResult;
|
||||
// NOTE: we don't throttle this when merges fall behind because delete-by-id does not create new segments:
|
||||
try (ReleasableLock ignored = readLock.acquire(); Releasable ignored2 = acquireLock(delete.uid())) {
|
||||
try (ReleasableLock ignored = readLock.acquire(); Releasable ignored2 = versionMap.acquireLock(delete.uid().bytes())) {
|
||||
ensureOpen();
|
||||
lastWriteNanos = delete.startTime();
|
||||
final DeletionStrategy plan;
|
||||
|
@ -1520,7 +1522,8 @@ public class InternalEngine extends Engine {
|
|||
// we only need to prune the deletes map; the current/old version maps are cleared on refresh:
|
||||
for (Map.Entry<BytesRef, DeleteVersionValue> entry : versionMap.getAllTombstones()) {
|
||||
BytesRef uid = entry.getKey();
|
||||
try (Releasable ignored = acquireLock(uid)) { // can we do it without this lock on each value? maybe batch to a set and get the lock once per set?
|
||||
try (Releasable ignored = versionMap.acquireLock(uid)) {
|
||||
// can we do it without this lock on each value? maybe batch to a set and get the lock once per set?
|
||||
|
||||
// Must re-get it here, vs using entry.getValue(), in case the uid was indexed/deleted since we pulled the iterator:
|
||||
DeleteVersionValue versionValue = versionMap.getTombstoneUnderLock(uid);
|
||||
|
@ -1767,14 +1770,6 @@ public class InternalEngine extends Engine {
|
|||
}
|
||||
}
|
||||
|
||||
private Releasable acquireLock(BytesRef uid) {
|
||||
return keyedLock.acquire(uid);
|
||||
}
|
||||
|
||||
private Releasable acquireLock(Term uid) {
|
||||
return acquireLock(uid.bytes());
|
||||
}
|
||||
|
||||
private long loadCurrentVersionFromIndex(Term uid) throws IOException {
|
||||
assert incrementIndexVersionLookup();
|
||||
try (Searcher searcher = acquireSearcher("load_version", SearcherScope.INTERNAL)) {
|
||||
|
|
|
@ -23,7 +23,9 @@ import org.apache.lucene.search.ReferenceManager;
|
|||
import org.apache.lucene.util.Accountable;
|
||||
import org.apache.lucene.util.BytesRef;
|
||||
import org.apache.lucene.util.RamUsageEstimator;
|
||||
import org.elasticsearch.common.lease.Releasable;
|
||||
import org.elasticsearch.common.util.concurrent.ConcurrentCollections;
|
||||
import org.elasticsearch.common.util.concurrent.KeyedLock;
|
||||
|
||||
import java.io.IOException;
|
||||
import java.util.Collection;
|
||||
|
@ -34,6 +36,8 @@ import java.util.concurrent.atomic.AtomicLong;
|
|||
/** Maps _uid value to its version information. */
|
||||
final class LiveVersionMap implements ReferenceManager.RefreshListener, Accountable {
|
||||
|
||||
private final KeyedLock<BytesRef> keyedLock = new KeyedLock<>();
|
||||
|
||||
/**
|
||||
* Resets the internal map and adjusts it's capacity as if there were no indexing operations.
|
||||
* This must be called under write lock in the engine
|
||||
|
@ -151,12 +155,14 @@ final class LiveVersionMap implements ReferenceManager.RefreshListener, Accounta
|
|||
// this map is only maintained if assertions are enabled
|
||||
private volatile Maps unsafeKeysMap = new Maps();
|
||||
|
||||
/** Bytes consumed for each BytesRef UID:
|
||||
/**
|
||||
* Bytes consumed for each BytesRef UID:
|
||||
* In this base value, we account for the {@link BytesRef} object itself as
|
||||
* well as the header of the byte[] array it holds, and some lost bytes due
|
||||
* to object alignment. So consumers of this constant just have to add the
|
||||
* length of the byte[] (assuming it is not shared between multiple
|
||||
* instances). */
|
||||
* instances).
|
||||
*/
|
||||
private static final long BASE_BYTES_PER_BYTESREF =
|
||||
// shallow memory usage of the BytesRef object
|
||||
RamUsageEstimator.shallowSizeOfInstance(BytesRef.class) +
|
||||
|
@ -167,8 +173,11 @@ final class LiveVersionMap implements ReferenceManager.RefreshListener, Accounta
|
|||
// lost bytes on average
|
||||
3;
|
||||
|
||||
/** Bytes used by having CHM point to a key/value. */
|
||||
/**
|
||||
* Bytes used by having CHM point to a key/value.
|
||||
*/
|
||||
private static final long BASE_BYTES_PER_CHM_ENTRY;
|
||||
|
||||
static {
|
||||
// use the same impl as the Maps does
|
||||
Map<Integer, Integer> map = ConcurrentCollections.newConcurrentMapWithAggressiveConcurrency();
|
||||
|
@ -181,11 +190,15 @@ final class LiveVersionMap implements ReferenceManager.RefreshListener, Accounta
|
|||
BASE_BYTES_PER_CHM_ENTRY = chmEntryShallowSize + 2 * RamUsageEstimator.NUM_BYTES_OBJECT_REF;
|
||||
}
|
||||
|
||||
/** Tracks bytes used by current map, i.e. what is freed on refresh. For deletes, which are also added to tombstones, we only account
|
||||
* for the CHM entry here, and account for BytesRef/VersionValue against the tombstones, since refresh would not clear this RAM. */
|
||||
/**
|
||||
* Tracks bytes used by current map, i.e. what is freed on refresh. For deletes, which are also added to tombstones, we only account
|
||||
* for the CHM entry here, and account for BytesRef/VersionValue against the tombstones, since refresh would not clear this RAM.
|
||||
*/
|
||||
final AtomicLong ramBytesUsedCurrent = new AtomicLong();
|
||||
|
||||
/** Tracks bytes used by tombstones (deletes) */
|
||||
/**
|
||||
* Tracks bytes used by tombstones (deletes)
|
||||
*/
|
||||
final AtomicLong ramBytesUsedTombstones = new AtomicLong();
|
||||
|
||||
@Override
|
||||
|
@ -215,12 +228,15 @@ final class LiveVersionMap implements ReferenceManager.RefreshListener, Accounta
|
|||
|
||||
}
|
||||
|
||||
/** Returns the live version (add or delete) for this uid. */
|
||||
/**
|
||||
* Returns the live version (add or delete) for this uid.
|
||||
*/
|
||||
VersionValue getUnderLock(final BytesRef uid) {
|
||||
return getUnderLock(uid, maps);
|
||||
}
|
||||
|
||||
private VersionValue getUnderLock(final BytesRef uid, Maps currentMaps) {
|
||||
assert keyedLock.isHeldByCurrentThread(uid);
|
||||
// First try to get the "live" value:
|
||||
VersionValue value = currentMaps.current.get(uid);
|
||||
if (value != null) {
|
||||
|
@ -255,8 +271,11 @@ final class LiveVersionMap implements ReferenceManager.RefreshListener, Accounta
|
|||
return maps.isSafeAccessMode();
|
||||
}
|
||||
|
||||
/** Adds this uid/version to the pending adds map iff the map needs safe access. */
|
||||
/**
|
||||
* Adds this uid/version to the pending adds map iff the map needs safe access.
|
||||
*/
|
||||
void maybePutUnderLock(BytesRef uid, VersionValue version) {
|
||||
assert keyedLock.isHeldByCurrentThread(uid);
|
||||
Maps maps = this.maps;
|
||||
if (maps.isSafeAccessMode()) {
|
||||
putUnderLock(uid, version, maps);
|
||||
|
@ -271,14 +290,19 @@ final class LiveVersionMap implements ReferenceManager.RefreshListener, Accounta
|
|||
return true;
|
||||
}
|
||||
|
||||
/** Adds this uid/version to the pending adds map. */
|
||||
/**
|
||||
* Adds this uid/version to the pending adds map.
|
||||
*/
|
||||
void putUnderLock(BytesRef uid, VersionValue version) {
|
||||
Maps maps = this.maps;
|
||||
putUnderLock(uid, version, maps);
|
||||
}
|
||||
|
||||
/** Adds this uid/version to the pending adds map. */
|
||||
/**
|
||||
* Adds this uid/version to the pending adds map.
|
||||
*/
|
||||
private void putUnderLock(BytesRef uid, VersionValue version, Maps maps) {
|
||||
assert keyedLock.isHeldByCurrentThread(uid);
|
||||
assert uid.bytes.length == uid.length : "Oversized _uid! UID length: " + uid.length + ", bytes length: " + uid.bytes.length;
|
||||
long uidRAMBytesUsed = BASE_BYTES_PER_BYTESREF + uid.bytes.length;
|
||||
final VersionValue prev = maps.current.put(uid, version);
|
||||
|
@ -325,9 +349,11 @@ final class LiveVersionMap implements ReferenceManager.RefreshListener, Accounta
|
|||
}
|
||||
}
|
||||
|
||||
/** Removes this uid from the pending deletes map. */
|
||||
/**
|
||||
* Removes this uid from the pending deletes map.
|
||||
*/
|
||||
void removeTombstoneUnderLock(BytesRef uid) {
|
||||
|
||||
assert keyedLock.isHeldByCurrentThread(uid);
|
||||
long uidRAMBytesUsed = BASE_BYTES_PER_BYTESREF + uid.bytes.length;
|
||||
|
||||
final VersionValue prev = tombstones.remove(uid);
|
||||
|
@ -345,22 +371,31 @@ final class LiveVersionMap implements ReferenceManager.RefreshListener, Accounta
|
|||
}
|
||||
}
|
||||
|
||||
/** Caller has a lock, so that this uid will not be concurrently added/deleted by another thread. */
|
||||
/**
|
||||
* Caller has a lock, so that this uid will not be concurrently added/deleted by another thread.
|
||||
*/
|
||||
DeleteVersionValue getTombstoneUnderLock(BytesRef uid) {
|
||||
assert keyedLock.isHeldByCurrentThread(uid);
|
||||
return tombstones.get(uid);
|
||||
}
|
||||
|
||||
/** Iterates over all deleted versions, including new ones (not yet exposed via reader) and old ones (exposed via reader but not yet GC'd). */
|
||||
/**
|
||||
* Iterates over all deleted versions, including new ones (not yet exposed via reader) and old ones (exposed via reader but not yet GC'd).
|
||||
*/
|
||||
Iterable<Map.Entry<BytesRef, DeleteVersionValue>> getAllTombstones() {
|
||||
return tombstones.entrySet();
|
||||
}
|
||||
|
||||
/** clears all tombstones ops */
|
||||
/**
|
||||
* clears all tombstones ops
|
||||
*/
|
||||
void clearTombstones() {
|
||||
tombstones.clear();
|
||||
}
|
||||
|
||||
/** Called when this index is closed. */
|
||||
/**
|
||||
* Called when this index is closed.
|
||||
*/
|
||||
synchronized void clear() {
|
||||
maps = new Maps();
|
||||
tombstones.clear();
|
||||
|
@ -377,8 +412,10 @@ final class LiveVersionMap implements ReferenceManager.RefreshListener, Accounta
|
|||
return ramBytesUsedCurrent.get() + ramBytesUsedTombstones.get();
|
||||
}
|
||||
|
||||
/** Returns how much RAM would be freed up by refreshing. This is {@link #ramBytesUsed} except does not include tombstones because they
|
||||
* don't clear on refresh. */
|
||||
/**
|
||||
* Returns how much RAM would be freed up by refreshing. This is {@link #ramBytesUsed} except does not include tombstones because they
|
||||
* don't clear on refresh.
|
||||
*/
|
||||
long ramBytesUsedForRefresh() {
|
||||
return ramBytesUsedCurrent.get();
|
||||
}
|
||||
|
@ -389,7 +426,20 @@ final class LiveVersionMap implements ReferenceManager.RefreshListener, Accounta
|
|||
return Collections.emptyList();
|
||||
}
|
||||
|
||||
/** Returns the current internal versions as a point in time snapshot*/
|
||||
/**
|
||||
* Returns the current internal versions as a point in time snapshot
|
||||
*/
|
||||
Map<BytesRef, VersionValue> getAllCurrent() {
|
||||
return maps.current.map;
|
||||
}}
|
||||
}
|
||||
|
||||
/**
|
||||
* Acquires a releaseable lock for the given uId. All *UnderLock methods require
|
||||
* this lock to be hold by the caller otherwise the visibility guarantees of this version
|
||||
* map are broken. We assert on this lock to be hold when calling these methods.
|
||||
* @see KeyedLock
|
||||
*/
|
||||
Releasable acquireLock(BytesRef uid) {
|
||||
return keyedLock.acquire(uid);
|
||||
}
|
||||
}
|
||||
|
|
|
@ -47,8 +47,10 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
BytesRefBuilder uid = new BytesRefBuilder();
|
||||
uid.copyChars(TestUtil.randomSimpleString(random(), 10, 20));
|
||||
VersionValue version = new VersionValue(randomLong(), randomLong(), randomLong());
|
||||
try (Releasable r = map.acquireLock(uid.toBytesRef())) {
|
||||
map.putUnderLock(uid.toBytesRef(), version);
|
||||
}
|
||||
}
|
||||
long actualRamBytesUsed = RamUsageTester.sizeOf(map);
|
||||
long estimatedRamBytesUsed = map.ramBytesUsed();
|
||||
// less than 50% off
|
||||
|
@ -62,8 +64,10 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
BytesRefBuilder uid = new BytesRefBuilder();
|
||||
uid.copyChars(TestUtil.randomSimpleString(random(), 10, 20));
|
||||
VersionValue version = new VersionValue(randomLong(), randomLong(), randomLong());
|
||||
try (Releasable r = map.acquireLock(uid.toBytesRef())) {
|
||||
map.putUnderLock(uid.toBytesRef(), version);
|
||||
}
|
||||
}
|
||||
actualRamBytesUsed = RamUsageTester.sizeOf(map);
|
||||
estimatedRamBytesUsed = map.ramBytesUsed();
|
||||
// less than 25% off
|
||||
|
@ -79,14 +83,13 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
|
||||
public void testBasics() throws IOException {
|
||||
LiveVersionMap map = new LiveVersionMap();
|
||||
try (Releasable r = map.acquireLock(uid("test"))) {
|
||||
map.putUnderLock(uid("test"), new VersionValue(1, 1, 1));
|
||||
assertEquals(new VersionValue(1, 1, 1), map.getUnderLock(uid("test")));
|
||||
map.beforeRefresh();
|
||||
assertEquals(new VersionValue(1, 1, 1), map.getUnderLock(uid("test")));
|
||||
map.afterRefresh(randomBoolean());
|
||||
assertNull(map.getUnderLock(uid("test")));
|
||||
|
||||
|
||||
map.putUnderLock(uid("test"), new DeleteVersionValue(1, 1, 1, Long.MAX_VALUE));
|
||||
assertEquals(new DeleteVersionValue(1, 1, 1, Long.MAX_VALUE), map.getUnderLock(uid("test")));
|
||||
map.beforeRefresh();
|
||||
|
@ -96,16 +99,21 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
map.removeTombstoneUnderLock(uid("test"));
|
||||
assertNull(map.getUnderLock(uid("test")));
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
public void testAdjustMapSizeUnderLock() throws IOException {
|
||||
LiveVersionMap map = new LiveVersionMap();
|
||||
try (Releasable r = map.acquireLock(uid("test"))) {
|
||||
map.putUnderLock(uid("test"), new VersionValue(1, 1, 1));
|
||||
}
|
||||
boolean withinRefresh = randomBoolean();
|
||||
if (withinRefresh) {
|
||||
map.beforeRefresh();
|
||||
}
|
||||
try (Releasable r = map.acquireLock(uid("test"))) {
|
||||
assertEquals(new VersionValue(1, 1, 1), map.getUnderLock(uid("test")));
|
||||
}
|
||||
final String msg;
|
||||
if (Assertions.ENABLED) {
|
||||
msg = expectThrows(AssertionError.class, map::adjustMapSizeUnderLock).getMessage();
|
||||
|
@ -113,7 +121,9 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
msg = expectThrows(IllegalStateException.class, map::adjustMapSizeUnderLock).getMessage();
|
||||
}
|
||||
assertEquals("map must be empty", msg);
|
||||
try (Releasable r = map.acquireLock(uid("test"))) {
|
||||
assertEquals(new VersionValue(1, 1, 1), map.getUnderLock(uid("test")));
|
||||
}
|
||||
if (withinRefresh == false) {
|
||||
map.beforeRefresh();
|
||||
}
|
||||
|
@ -131,7 +141,6 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
}
|
||||
List<BytesRef> keyList = new ArrayList<>(keySet);
|
||||
ConcurrentHashMap<BytesRef, VersionValue> values = new ConcurrentHashMap<>();
|
||||
KeyedLock<BytesRef> keyedLock = new KeyedLock<>();
|
||||
LiveVersionMap map = new LiveVersionMap();
|
||||
int numThreads = randomIntBetween(2, 5);
|
||||
|
||||
|
@ -151,7 +160,7 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
try {
|
||||
for (int i = 0; i < randomValuesPerThread; ++i) {
|
||||
BytesRef bytesRef = randomFrom(random(), keyList);
|
||||
try (Releasable r = keyedLock.acquire(bytesRef)) {
|
||||
try (Releasable r = map.acquireLock(bytesRef)) {
|
||||
VersionValue versionValue = values.computeIfAbsent(bytesRef,
|
||||
v -> new VersionValue(randomLong(), randomLong(), randomLong()));
|
||||
boolean isDelete = versionValue instanceof DeleteVersionValue;
|
||||
|
@ -180,12 +189,15 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
Map<BytesRef, VersionValue> valueMap = new HashMap<>(map.getAllCurrent());
|
||||
map.beforeRefresh();
|
||||
valueMap.forEach((k, v) -> {
|
||||
try (Releasable r = map.acquireLock(k)) {
|
||||
VersionValue actualValue = map.getUnderLock(k);
|
||||
assertNotNull(actualValue);
|
||||
assertTrue(v.version <= actualValue.version);
|
||||
}
|
||||
});
|
||||
map.afterRefresh(randomBoolean());
|
||||
valueMap.forEach((k, v) -> {
|
||||
try (Releasable r = map.acquireLock(k)) {
|
||||
VersionValue actualValue = map.getUnderLock(k);
|
||||
if (actualValue != null) {
|
||||
if (actualValue instanceof DeleteVersionValue) {
|
||||
|
@ -195,6 +207,7 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
}
|
||||
|
||||
}
|
||||
}
|
||||
});
|
||||
if (randomBoolean()) {
|
||||
Thread.yield();
|
||||
|
@ -232,7 +245,9 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
assertTrue("failed in iter: " + i, map.isSafeAccessRequired());
|
||||
}
|
||||
|
||||
try (Releasable r = map.acquireLock(uid(""))) {
|
||||
map.maybePutUnderLock(new BytesRef(""), new VersionValue(randomLong(), randomLong(), randomLong()));
|
||||
}
|
||||
assertFalse(map.isUnsafe());
|
||||
assertEquals(1, map.getAllCurrent().size());
|
||||
|
||||
|
@ -240,8 +255,9 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
map.afterRefresh(randomBoolean());
|
||||
assertFalse(map.isUnsafe());
|
||||
assertFalse(map.isSafeAccessRequired());
|
||||
|
||||
try (Releasable r = map.acquireLock(uid(""))) {
|
||||
map.maybePutUnderLock(new BytesRef(""), new VersionValue(randomLong(), randomLong(), randomLong()));
|
||||
}
|
||||
assertTrue(map.isUnsafe());
|
||||
assertFalse(map.isSafeAccessRequired());
|
||||
assertEquals(0, map.getAllCurrent().size());
|
||||
|
@ -249,6 +265,7 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
|
||||
public void testRefreshTransition() throws IOException {
|
||||
LiveVersionMap map = new LiveVersionMap();
|
||||
try (Releasable r = map.acquireLock(uid("1"))) {
|
||||
map.maybePutUnderLock(uid("1"), new VersionValue(randomLong(), randomLong(), randomLong()));
|
||||
assertTrue(map.isUnsafe());
|
||||
assertNull(map.getUnderLock(uid("1")));
|
||||
|
@ -273,3 +290,4 @@ public class LiveVersionMapTests extends ESTestCase {
|
|||
assertTrue(map.isSafeAccessRequired());
|
||||
}
|
||||
}
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue