carp84 commented on a change in pull request #9501: [FLINK-12697] [State Backends] Support on-disk state storage for spill-able heap backend URL: https://github.com/apache/flink/pull/9501#discussion_r329036607
########## File path: flink-state-backends/flink-statebackend-heap-spillable/src/test/java/org/apache/flink/runtime/state/heap/CopyOnWriteSkipListStateMapTest.java ########## @@ -0,0 +1,1448 @@ +/* + * + * * Licensed to the Apache Software Foundation (ASF) under one + * * or more contributor license agreements. See the NOTICE file + * * distributed with this work for additional information + * * regarding copyright ownership. The ASF licenses this file + * * to you under the Apache License, Version 2.0 (the + * * "License"); you may not use this file except in compliance + * * with the License. You may obtain a copy of the License at + * * + * * http://www.apache.org/licenses/LICENSE-2.0 + * * + * * Unless required by applicable law or agreed to in writing, software + * * distributed under the License is distributed on an "AS IS" BASIS, + * * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * * See the License for the specific language governing permissions and + * * limitations under the License. 
+ * + */ + +package org.apache.flink.runtime.state.heap; + +import org.apache.flink.api.common.typeutils.TypeSerializer; +import org.apache.flink.api.common.typeutils.base.IntSerializer; +import org.apache.flink.api.common.typeutils.base.LongSerializer; +import org.apache.flink.api.common.typeutils.base.StringSerializer; +import org.apache.flink.core.memory.ByteArrayInputStreamWithPos; +import org.apache.flink.core.memory.ByteArrayOutputStreamWithPos; +import org.apache.flink.core.memory.DataInputView; +import org.apache.flink.core.memory.DataInputViewStreamWrapper; +import org.apache.flink.core.memory.DataOutputView; +import org.apache.flink.core.memory.DataOutputViewStreamWrapper; +import org.apache.flink.runtime.state.StateEntry; +import org.apache.flink.runtime.state.StateSnapshotTransformer; +import org.apache.flink.runtime.state.StateTransformationFunction; +import org.apache.flink.runtime.state.heap.space.Allocator; +import org.apache.flink.runtime.state.internal.InternalKvState; +import org.apache.flink.util.IOUtils; +import org.apache.flink.util.TestLogger; + +import org.junit.After; +import org.junit.Assert; +import org.junit.Before; +import org.junit.Test; + +import javax.annotation.Nullable; + +import java.io.IOException; +import java.nio.ByteBuffer; +import java.util.ArrayList; +import java.util.Collection; +import java.util.HashMap; +import java.util.HashSet; +import java.util.Iterator; +import java.util.List; +import java.util.Map; +import java.util.Set; +import java.util.concurrent.ThreadLocalRandom; + +import static org.apache.flink.runtime.state.heap.SkipListUtils.NIL_NODE; +import static org.hamcrest.Matchers.is; +import static org.junit.Assert.assertEquals; +import static org.junit.Assert.assertFalse; +import static org.junit.Assert.assertNull; +import static org.junit.Assert.assertTrue; + +/** + * Tests for {@link CopyOnWriteSkipListStateMap}. 
+ */ +public class CopyOnWriteSkipListStateMapTest extends TestLogger { + + private TestAllocator spaceAllocator; + + @Before + public void setUp() { + int maxAllocateSize = 256; + spaceAllocator = new TestAllocator(maxAllocateSize); + } + + @After + public void tearDown() { + IOUtils.closeQuietly(spaceAllocator); + } + + /** + * Test initialization of state map. + */ + @Test + public void testInitStateMap() { + TypeSerializer<Integer> keySerializer = IntSerializer.INSTANCE; + TypeSerializer<Long> namespaceSerializer = LongSerializer.INSTANCE; + TypeSerializer<String> stateSerializer = StringSerializer.INSTANCE; + CopyOnWriteSkipListStateMap<Integer, Long, String> stateMap = new CopyOnWriteSkipListStateMap<>( + keySerializer, namespaceSerializer, stateSerializer, spaceAllocator); + + assertTrue(stateMap.isEmpty()); + assertEquals(0, stateMap.size()); + assertEquals(0, stateMap.totalSize()); + assertEquals(0, stateMap.getRequestCount()); + assertTrue(stateMap.getLogicallyRemovedNodes().isEmpty()); + assertEquals(0, stateMap.getHighestRequiredSnapshotVersion()); + assertEquals(0, stateMap.getHighestFinishedSnapshotVersion()); + assertTrue(stateMap.getSnapshotVersions().isEmpty()); + assertTrue(stateMap.getPruningValueNodes().isEmpty()); + assertEquals(0, stateMap.getResourceGuard().getLeaseCount()); + assertFalse(stateMap.getResourceGuard().isClosed()); + assertFalse(stateMap.isClosed()); + + assertNull(stateMap.get(0, 0L)); + assertFalse(stateMap.containsKey(1, 2L)); + assertNull(stateMap.removeAndGetOld(3, 4L)); + assertFalse(stateMap.getKeys(-92L).iterator().hasNext()); + assertEquals(0, stateMap.sizeOfNamespace(8L)); + assertFalse(stateMap.iterator().hasNext()); + assertFalse(stateMap.getStateIncrementalVisitor(100).hasNext()); + + stateMap.close(); + assertEquals(0, stateMap.size()); + assertEquals(0, stateMap.totalSize()); + assertTrue(stateMap.isClosed()); + } + + /** + * Test basic operations. 
+ */ + @Test + public void testBasicOperations() throws Exception { + TypeSerializer<Integer> keySerializer = IntSerializer.INSTANCE; + TypeSerializer<Long> namespaceSerializer = LongSerializer.INSTANCE; + TypeSerializer<String> stateSerializer = StringSerializer.INSTANCE; + CopyOnWriteSkipListStateMap<Integer, Long, String> stateMap = new CopyOnWriteSkipListStateMap<>( + keySerializer, namespaceSerializer, stateSerializer, spaceAllocator); + + ThreadLocalRandom random = ThreadLocalRandom.current(); + // map to store expected states, namespace -> key -> state + Map<Long, Map<Integer, String>> referenceStates = new HashMap<>(); + int totalSize = 0; + + // put some states + for (long namespace = 0; namespace < 10; namespace++) { + for (int key = 0; key < 100; key++) { + totalSize++; + String state = String.valueOf(key * namespace); + if (random.nextBoolean()) { + stateMap.put(key, namespace, state); + } else { + assertNull(stateMap.putAndGetOld(key, namespace, state)); + } + referenceStates.computeIfAbsent(namespace, (none) -> new HashMap<>()).put(key, state); + assertEquals(totalSize, stateMap.size()); + assertEquals(totalSize, stateMap.totalSize()); + } + } + + // validates space allocation. 
Each pair need 2 spaces + assertEquals(totalSize * 2, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + // remove some states + Map<Long, Set<Integer>> removedStates = new HashMap<>(); + for (Map.Entry<Long, Map<Integer, String>> namespaceEntry : referenceStates.entrySet()) { + long namespace = namespaceEntry.getKey(); + for (Map.Entry<Integer, String> keyEntry : namespaceEntry.getValue().entrySet()) { + if (random.nextBoolean()) { + int key = keyEntry.getKey(); + String state = keyEntry.getValue(); + removedStates.computeIfAbsent(namespace, (none) -> new HashSet<>()).add(key); + totalSize--; + if (random.nextBoolean()) { + stateMap.remove(key, namespace); + } else { + assertEquals(state, stateMap.removeAndGetOld(key, namespace)); + } + assertEquals(totalSize, stateMap.size()); + assertEquals(totalSize, stateMap.totalSize()); + } + } + } + + for (Map.Entry<Long, Set<Integer>> entry : removedStates.entrySet()) { + long namespace = entry.getKey(); + Map<Integer, String> keyMap = referenceStates.get(namespace); + if (keyMap != null) { + entry.getValue().forEach(keyMap::remove); + if (keyMap.isEmpty()) { + referenceStates.remove(namespace); + } + } + for (int key : entry.getValue()) { + assertNull(stateMap.get(key, namespace)); + assertFalse(stateMap.containsKey(key, namespace)); + } + } + + assertEquals(totalSize * 2, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + // update some states + for (Map.Entry<Long, Map<Integer, String>> namespaceEntry : referenceStates.entrySet()) { + long namespace = namespaceEntry.getKey(); + for (Map.Entry<Integer, String> keyEntry : namespaceEntry.getValue().entrySet()) { + if (random.nextBoolean()) { + int key = keyEntry.getKey(); + String state = keyEntry.getValue(); + String newState = state + "-update"; + keyEntry.setValue(newState); + if (random.nextBoolean()) { + stateMap.put(key, namespace, newState); + } else { + assertEquals(state, 
stateMap.putAndGetOld(key, namespace, newState)); + } + assertEquals(totalSize, stateMap.size()); + assertEquals(totalSize, stateMap.totalSize()); + } + } + } + + // put some new states + for (long namespace = 10; namespace < 15; namespace++) { + for (int key = 0; key < 100; key++) { + totalSize++; + String state = String.valueOf(key * namespace); + if (random.nextBoolean()) { + stateMap.put(key, namespace, state); + } else { + assertNull(stateMap.putAndGetOld(key, namespace, state)); + } + referenceStates.computeIfAbsent(namespace, (none) -> new HashMap<>()).put(key, state); + assertEquals(totalSize, stateMap.size()); + assertEquals(totalSize, stateMap.totalSize()); + } + } + + // remove some absent states + for (Map.Entry<Long, Set<Integer>> entry : removedStates.entrySet()) { + long namespace = entry.getKey(); + for (int key : entry.getValue()) { + if (random.nextBoolean()) { + stateMap.remove(key, namespace); + } else { + assertNull(stateMap.removeAndGetOld(key, namespace)); + } + assertEquals(totalSize, stateMap.size()); + assertEquals(totalSize, stateMap.totalSize()); + } + } + + assertEquals(totalSize * 2, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + StateTransformationFunction<String, Integer> function = + (String prevState, Integer value) -> prevState == null ? 
String.valueOf(value) : prevState + value; + + // transform some old states + for (Map.Entry<Long, Map<Integer, String>> namespaceEntry : referenceStates.entrySet()) { + long namespace = namespaceEntry.getKey(); + for (Map.Entry<Integer, String> keyEntry : namespaceEntry.getValue().entrySet()) { + if (random.nextBoolean()) { + int key = keyEntry.getKey(); + String state = keyEntry.getValue(); + int delta = random.nextInt(); + String newState = function.apply(state, delta); + keyEntry.setValue(newState); + stateMap.transform(key, namespace, delta, function); + assertEquals(totalSize, stateMap.size()); + assertEquals(totalSize, stateMap.totalSize()); + } + } + } + + // transform some new states + for (long namespace = 15; namespace < 20; namespace++) { + for (int key = 0; key < 100; key++) { + totalSize++; + int value = (int) (key * namespace); + stateMap.transform(key, namespace, value, function); + referenceStates.computeIfAbsent(namespace, (none) -> new HashMap<>()).put(key, String.valueOf(value)); + assertEquals(totalSize, stateMap.size()); + assertEquals(totalSize, stateMap.totalSize()); + } + } + + assertEquals(totalSize * 2, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + // put some previously removed states + for (Map.Entry<Long, Set<Integer>> entry : removedStates.entrySet()) { + long namespace = entry.getKey(); + for (int key : entry.getValue()) { + totalSize++; + String state = String.valueOf(key * namespace); + if (random.nextBoolean()) { + stateMap.put(key, namespace, state); + } else { + assertNull(stateMap.putAndGetOld(key, namespace, state)); + } + referenceStates.computeIfAbsent(namespace, (none) -> new HashMap<>()).put(key, String.valueOf(state)); + assertEquals(totalSize, stateMap.size()); + assertEquals(totalSize, stateMap.totalSize()); + } + } + + assertEquals(totalSize * 2, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + // remove some namespaces + Set<Long> 
removedNamespaces = new HashSet<>(); + for (Map.Entry<Long, Map<Integer, String>> namespaceEntry : referenceStates.entrySet()) { + if (random.nextBoolean()) { + long namespace = namespaceEntry.getKey(); + removedNamespaces.add(namespace); + for (Map.Entry<Integer, String> keyEntry : namespaceEntry.getValue().entrySet()) { + int key = keyEntry.getKey(); + if (random.nextBoolean()) { + stateMap.remove(key, namespace); + } else { + assertEquals(keyEntry.getValue(), stateMap.removeAndGetOld(key, namespace)); + } + totalSize--; + assertEquals(totalSize, stateMap.size()); + assertEquals(totalSize, stateMap.totalSize()); + } + } + } + + for (long namespace : removedNamespaces) { + referenceStates.remove(namespace); + assertEquals(0, stateMap.sizeOfNamespace(namespace)); + assertFalse(stateMap.getKeys(namespace).iterator().hasNext()); + } + + assertEquals(totalSize * 2, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + stateMap.close(); + assertEquals(0, stateMap.size()); + assertEquals(0, stateMap.totalSize()); + // all spaces should be free + assertEquals(0, spaceAllocator.getTotalSpaceNumber()); + assertTrue(stateMap.isClosed()); + } + + /** + * Tests copy-on-write contracts. 
+ */ + @SuppressWarnings("unchecked") + @Test + public void testCopyOnWriteContracts() throws IOException { + TypeSerializer<Integer> keySerializer = IntSerializer.INSTANCE; + TypeSerializer<Long> namespaceSerializer = LongSerializer.INSTANCE; + TypeSerializer<String> stateSerializer = StringSerializer.INSTANCE; + // do not remove states physically when get, put, remove and snapshot + CopyOnWriteSkipListStateMap<Integer, Long, String> stateMap = new CopyOnWriteSkipListStateMap<>( + keySerializer, + namespaceSerializer, + stateSerializer, + spaceAllocator, + 0, + 1.0f); + + StateSnapshotTransformer<String> transformer = new StateSnapshotTransformer<String>() { + @Nullable + @Override + public String filterOrTransform(@Nullable String value) { + if (value == null) { + return null; + } + int op = value.hashCode() % 3; + switch (op) { + case 0: + return null; + case 1: + return value + "-transform"; + default: + return value; + } + } + }; + + // map to store expected states, namespace -> key -> state + Map<Long, Map<Integer, String>> referenceStates = new HashMap<>(); + int totalStateSize = 0; + int totalSizeIncludingLogicalRemovedKey = 0; + int totalLogicallyRemovedKey = 0; + int totalSpaceNumber = 0; + + // take snapshot 1 which is an empty snapshot + Map<Long, Map<Integer, String>> expectedSnapshot1 = snapshotReferenceStates(referenceStates); + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot1 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String>) stateMap.stateSnapshot(); + assertEquals(1, stateMap.getHighestRequiredSnapshotVersion()); + assertEquals(1, stateMap.getSnapshotVersions().size()); + assertEquals(true, stateMap.getSnapshotVersions().contains(1)); + assertEquals(1, stateMap.getResourceGuard().getLeaseCount()); + verifySnapshotWithoutTransform( + expectedSnapshot1, snapshot1, keySerializer, namespaceSerializer, stateSerializer); + verifySnapshotWithTransform( + expectedSnapshot1, snapshot1, transformer, keySerializer, 
namespaceSerializer, stateSerializer); + + snapshot1.release(); + assertEquals(1, stateMap.getStateMapVersion()); + assertEquals(0, stateMap.getHighestRequiredSnapshotVersion()); + assertEquals(1, stateMap.getHighestFinishedSnapshotVersion()); + assertTrue(stateMap.getSnapshotVersions().isEmpty()); + assertEquals(0, stateMap.getResourceGuard().getLeaseCount()); + + // put some states + for (int i = 1; i <= 10; i++) { + totalStateSize++; + totalSizeIncludingLogicalRemovedKey++; + totalSpaceNumber += 2; + stateMap.put(i, (long) i, String.valueOf(i)); + addToReferenceState(referenceStates, i, (long) i, String.valueOf(i)); + } + + // take snapshot 2 + Map<Long, Map<Integer, String>> expectedSnapshot2 = snapshotReferenceStates(referenceStates); + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot2 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String>) stateMap.stateSnapshot(); + assertEquals(2, stateMap.getStateMapVersion()); + assertEquals(2, stateMap.getHighestRequiredSnapshotVersion()); + assertEquals(1, stateMap.getSnapshotVersions().size()); + assertEquals(true, stateMap.getSnapshotVersions().contains(2)); + assertEquals(1, stateMap.getResourceGuard().getLeaseCount()); + + // 1. 
test put -> put -> remove for (key 1, namespace 1) + + // put (key 1, namespace 1), and copy-on-write should happen + stateMap.put(1, 1L, String.valueOf("11")); + addToReferenceState(referenceStates, 1, 1L, "11"); + // a space for new value should be allocated + totalSpaceNumber += 1; + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + assertEquals("11", stateMap.get(1, 1L)); + assertTrue(stateMap.containsKey(1, 1L)); + assertEquals(totalStateSize, stateMap.size()); + verifyState(referenceStates, stateMap); + + // put (key 1, namespace 1) again, old value should be replaced and space will not increase + assertEquals("11", stateMap.putAndGetOld(1, 1L, String.valueOf("111"))); + addToReferenceState(referenceStates, 1, 1L, "111"); + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + assertEquals("111", stateMap.get(1, 1L)); + assertTrue(stateMap.containsKey(1, 1L)); + verifyState(referenceStates, stateMap); + + // remove (key 1, namespace 1) + stateMap.remove(1, 1L); + removeFromReferenceState(referenceStates, 1, 1L); + totalStateSize--; + totalLogicallyRemovedKey++; + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + assertNull(stateMap.get(1, 1L)); + assertFalse(stateMap.containsKey(1, 1L)); + assertEquals(totalStateSize, stateMap.size()); + assertEquals(totalSizeIncludingLogicalRemovedKey, stateMap.totalSize()); + assertEquals(totalLogicallyRemovedKey, stateMap.getLogicallyRemovedNodes().size()); + verifyState(referenceStates, stateMap); + + // 2. 
test remove -> remove -> put for (key 4, namespace 4) + + // remove (key 4, namespace 4), and it should be logically removed + assertEquals("4", stateMap.removeAndGetOld(4, 4L)); + removeFromReferenceState(referenceStates, 4, 4L); + // a space should be allocated + totalStateSize--; + totalLogicallyRemovedKey++; + totalSpaceNumber += 1; + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + assertNull(stateMap.get(4, 4L)); + assertFalse(stateMap.containsKey(4, 4L)); + assertEquals(totalStateSize, stateMap.size()); + assertEquals(totalSizeIncludingLogicalRemovedKey, stateMap.totalSize()); + assertEquals(totalLogicallyRemovedKey, stateMap.getLogicallyRemovedNodes().size()); + verifyState(referenceStates, stateMap); + + // remove (key 4, namespace 4) again, and nothing should happen + assertNull(stateMap.removeAndGetOld(4, 4L)); + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + assertEquals(totalStateSize, stateMap.size()); + assertEquals(totalSizeIncludingLogicalRemovedKey, stateMap.totalSize()); + assertEquals(totalLogicallyRemovedKey, stateMap.getLogicallyRemovedNodes().size()); + verifyState(referenceStates, stateMap); + + // put the logically removed (key 4, namespace 4) + assertNull(stateMap.putAndGetOld(4, 4L, "44")); + addToReferenceState(referenceStates, 4, 4L, "44"); + totalStateSize++; + totalLogicallyRemovedKey--; + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + assertEquals("44", stateMap.get(4, 4L)); + assertTrue(stateMap.containsKey(4, 4L)); + assertEquals(totalStateSize, stateMap.size()); + assertEquals(totalSizeIncludingLogicalRemovedKey, stateMap.totalSize()); + assertEquals(totalLogicallyRemovedKey, stateMap.getLogicallyRemovedNodes().size()); + verifyState(referenceStates, stateMap); + + // 3. 
test put -> remove -> put for (key 6, namespace 6) + + // put (key 6, namespace 6), and copy-on-write should happen + assertEquals("6", stateMap.putAndGetOld(6, 6L, String.valueOf("66"))); + addToReferenceState(referenceStates, 6, 6L, "66"); + // a space for new value should be allocated + totalSpaceNumber += 1; + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + assertEquals("66", stateMap.get(6, 6L)); + assertTrue(stateMap.containsKey(6, 6L)); + assertEquals(totalStateSize, stateMap.size()); + verifyState(referenceStates, stateMap); + + // remove (key 6, namespace 6), and it should be logically removed + assertEquals("66", stateMap.removeAndGetOld(6, 6L)); + removeFromReferenceState(referenceStates, 6, 6L); + totalStateSize--; + totalLogicallyRemovedKey++; + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + assertNull(stateMap.get(6, 6L)); + assertFalse(stateMap.containsKey(6, 6L)); + assertEquals(totalStateSize, stateMap.size()); + assertEquals(totalSizeIncludingLogicalRemovedKey, stateMap.totalSize()); + assertEquals(totalLogicallyRemovedKey, stateMap.getLogicallyRemovedNodes().size()); + verifyState(referenceStates, stateMap); + + // put (key 6, namespace 6) again + assertNull(stateMap.putAndGetOld(6, 6L, String.valueOf("666"))); + addToReferenceState(referenceStates, 6, 6L, "666"); + totalStateSize++; + totalLogicallyRemovedKey--; + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + assertEquals("666", stateMap.get(6, 6L)); + assertTrue(stateMap.containsKey(6, 6L)); + assertEquals(totalStateSize, stateMap.size()); + assertEquals(totalSizeIncludingLogicalRemovedKey, stateMap.totalSize()); + assertEquals(totalLogicallyRemovedKey, stateMap.getLogicallyRemovedNodes().size()); + verifyState(referenceStates, stateMap); + + assertEquals("3", stateMap.removeAndGetOld(3, 3L)); + removeFromReferenceState(referenceStates, 3, 3L); + assertEquals("5", stateMap.removeAndGetOld(5, 5L)); + 
removeFromReferenceState(referenceStates, 5, 5L); + assertEquals("7", stateMap.removeAndGetOld(7, 7L)); + removeFromReferenceState(referenceStates, 7, 7L); + totalStateSize -= 3; + totalLogicallyRemovedKey += 3; + totalSpaceNumber += 3; + + // access some (key, namespace) not in state + for (long namespace = 0; namespace < 15; namespace++) { + for (int key = 1; key < 10; key++) { + if (namespace != key) { + assertNull(stateMap.get(key, namespace)); + assertFalse(stateMap.containsKey(key, namespace)); + assertNull(stateMap.removeAndGetOld(key, namespace)); + stateMap.remove(key, namespace); + } + } + if (namespace > 10) { + assertEquals(0, stateMap.sizeOfNamespace(namespace)); + assertFalse(stateMap.getKeys(namespace).iterator().hasNext()); + } + } + verifyState(referenceStates, stateMap); + + // put some new states + for (long namespace = 0; namespace < 15; namespace++) { + for (int key = 1; key < 20; key++) { + if (namespace != key) { + String state = String.valueOf(namespace * key); + if (state.hashCode() % 2 == 0) { + stateMap.put(key, namespace, state); + } else { + assertNull(stateMap.putAndGetOld(key, namespace, state)); + } + addToReferenceState(referenceStates, key, namespace, state); + totalSizeIncludingLogicalRemovedKey++; + totalStateSize++; + totalSpaceNumber += 2; + } + } + } + + verifySnapshotWithoutTransform( + expectedSnapshot2, snapshot2, keySerializer, namespaceSerializer, stateSerializer); + snapshot2.release(); + + // there is no value to prune + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + assertEquals(totalStateSize, stateMap.size()); + assertEquals(totalLogicallyRemovedKey, stateMap.getLogicallyRemovedNodes().size()); + assertEquals(0, stateMap.getHighestRequiredSnapshotVersion()); + assertEquals(2, stateMap.getHighestFinishedSnapshotVersion()); + assertTrue(stateMap.getSnapshotVersions().isEmpty()); + assertEquals(0, stateMap.getResourceGuard().getLeaseCount()); + + // validates snapshot will not include logically 
removed states + Map<Long, Map<Integer, String>> expectedSnapshot3 = snapshotReferenceStates(referenceStates); + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot3 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String>) stateMap.stateSnapshot(); + assertEquals(3, stateMap.getStateMapVersion()); + assertEquals(3, stateMap.getHighestRequiredSnapshotVersion()); + assertEquals(1, stateMap.getSnapshotVersions().size()); + assertEquals(true, stateMap.getSnapshotVersions().contains(3)); + assertEquals(1, stateMap.getResourceGuard().getLeaseCount()); + + // verify that logically removed states are not deleted in sync part of snapshot + assertEquals(totalLogicallyRemovedKey, stateMap.getLogicallyRemovedNodes().size()); + + verifySnapshotWithTransform( + expectedSnapshot3, snapshot3, transformer, keySerializer, namespaceSerializer, stateSerializer); + snapshot3.release(); + + // value of version 1 should be pruned by snapshot3 for 1, 3, 4, 5, 7, 6 + totalSpaceNumber -= 6; + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + // logically removed states are still in map + assertEquals(totalSizeIncludingLogicalRemovedKey, stateMap.totalSize()); + + // remove the logically removed state again, and they should be deleted physically + assertNull(stateMap.removeAndGetOld(1, 1L)); + assertNull(stateMap.removeAndGetOld(3, 3L)); + assertNull(stateMap.removeAndGetOld(5, 5L)); + assertNull(stateMap.removeAndGetOld(7, 7L)); + totalLogicallyRemovedKey -= 4; + totalSizeIncludingLogicalRemovedKey -= 4; + totalSpaceNumber -= 2 * 4; + assertEquals(totalLogicallyRemovedKey, stateMap.getLogicallyRemovedNodes().size()); + assertEquals(totalStateSize, stateMap.size()); + assertEquals(totalSizeIncludingLogicalRemovedKey, stateMap.totalSize()); + assertEquals(totalSpaceNumber, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + Map<Long, Map<Integer, String>> expectedSnapshot4 = 
snapshotReferenceStates(referenceStates); + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot4 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String>) stateMap.stateSnapshot(); + + // remove all states + for (Map.Entry<Long, Map<Integer, String>> namespaceEntry : referenceStates.entrySet()) { + for (Map.Entry<Integer, String> keyEntry : namespaceEntry.getValue().entrySet()) { + assertEquals(keyEntry.getValue(), stateMap.removeAndGetOld(keyEntry.getKey(), namespaceEntry.getKey())); + totalStateSize--; + totalLogicallyRemovedKey++; + } + } + Map<Long, Map<Integer, String>> allRemovedStates = snapshotReferenceStates(referenceStates); + referenceStates.clear(); + + verifySnapshotWithTransform( + expectedSnapshot4, snapshot4, transformer, keySerializer, namespaceSerializer, stateSerializer); + snapshot4.release(); + + assertEquals(totalStateSize, stateMap.size()); + assertEquals(totalLogicallyRemovedKey, stateMap.getLogicallyRemovedNodes().size()); + + for (Map.Entry<Long, Map<Integer, String>> namespaceEntry : allRemovedStates.entrySet()) { + long namespace = namespaceEntry.getKey(); + for (Map.Entry<Integer, String> keyEntry : namespaceEntry.getValue().entrySet()) { + int key = keyEntry.getKey(); + assertNull(stateMap.get(key, namespace)); + assertFalse(stateMap.containsKey(key, namespace)); + } + assertEquals(0, stateMap.sizeOfNamespace(namespace)); + assertFalse(stateMap.getKeys(namespace).iterator().hasNext()); + assertFalse(stateMap.getStateIncrementalVisitor(100).hasNext()); + } + + stateMap.close(); + assertEquals(0, stateMap.size()); + assertEquals(0, stateMap.totalSize()); + assertEquals(0, spaceAllocator.getTotalSpaceNumber()); + assertTrue(stateMap.isClosed()); + } + + /** + * Tests that remove states physically when get, put and remove. 
+ */ + @SuppressWarnings("unchecked") + @Test + public void testPhysicallyRemoveWhenGetPutAndRemove() throws IOException { + TypeSerializer<Integer> keySerializer = IntSerializer.INSTANCE; + TypeSerializer<Long> namespaceSerializer = LongSerializer.INSTANCE; + TypeSerializer<String> stateSerializer = StringSerializer.INSTANCE; + CopyOnWriteSkipListStateMap<Integer, Long, String> stateMap = new CopyOnWriteSkipListStateMap<>( + keySerializer, + namespaceSerializer, + stateSerializer, + spaceAllocator, + 2, + 1.0f); + + // map to store expected states, namespace -> key -> state + Map<Long, Map<Integer, String>> referenceStates = new HashMap<>(); + + // here we use a trick that put all odd namespace to state map, and get/put/remove even namespace + // so that all logically removed nodes can be accessed + + // validates get + prepareLogicallyRemovedStates( + referenceStates, stateMap, keySerializer, namespaceSerializer, stateSerializer); + for (int i = 0; i <= 100; i += 2) { + stateMap.get(i, (long) i); + } + assertEquals(0, stateMap.size()); + assertEquals(0, stateMap.totalSize()); + assertEquals(0, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + // validates containsKey + prepareLogicallyRemovedStates( + referenceStates, stateMap, keySerializer, namespaceSerializer, stateSerializer); + for (int i = 0; i <= 100; i += 2) { + assertFalse(stateMap.containsKey(i, (long) i)); + } + assertEquals(0, stateMap.size()); + assertEquals(0, stateMap.totalSize()); + assertEquals(0, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + // validates remove + prepareLogicallyRemovedStates( + referenceStates, stateMap, keySerializer, namespaceSerializer, stateSerializer); + for (int i = 0; i <= 100; i += 2) { + stateMap.remove(i, (long) i); + } + assertEquals(0, stateMap.size()); + assertEquals(0, stateMap.totalSize()); + assertEquals(0, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + 
+ // validates removeAndGetOld + prepareLogicallyRemovedStates( + referenceStates, stateMap, keySerializer, namespaceSerializer, stateSerializer); + for (int i = 0; i <= 100; i += 2) { + assertNull(stateMap.removeAndGetOld(i, (long) i)); + } + assertEquals(0, stateMap.size()); + assertEquals(0, stateMap.totalSize()); + assertEquals(0, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + // validates put + prepareLogicallyRemovedStates( + referenceStates, stateMap, keySerializer, namespaceSerializer, stateSerializer); + int putSize = 0; + for (int i = 0; i <= 100; i += 2) { + putSize++; + stateMap.put(i, (long) i, String.valueOf(i)); + addToReferenceState(referenceStates, i, (long) i, String.valueOf(i)); + } + assertEquals(putSize, stateMap.size()); + assertEquals(putSize, stateMap.totalSize()); + assertEquals(putSize * 2, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + for (int i = 0; i <= 100; i += 2) { + assertEquals(String.valueOf(i), stateMap.removeAndGetOld(i, (long) i)); + removeFromReferenceState(referenceStates, i, (long) i); + } + assertEquals(0, stateMap.size()); + assertEquals(0, stateMap.totalSize()); + assertEquals(0, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + // validates putAndGetOld + prepareLogicallyRemovedStates( + referenceStates, stateMap, keySerializer, namespaceSerializer, stateSerializer); + int putAndGetOldSize = 0; + for (int i = 0; i <= 100; i += 2) { + putAndGetOldSize++; + assertNull(stateMap.putAndGetOld(i, (long) i, String.valueOf(i))); + addToReferenceState(referenceStates, i, (long) i, String.valueOf(i)); + } + assertEquals(putAndGetOldSize, stateMap.size()); + assertEquals(putAndGetOldSize, stateMap.totalSize()); + assertEquals(putAndGetOldSize * 2, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + stateMap.close(); + assertEquals(0, stateMap.size()); + assertEquals(0, 
stateMap.totalSize()); + assertEquals(0, spaceAllocator.getTotalSpaceNumber()); + assertTrue(stateMap.isClosed()); + } + + /** + * Tests that remove states physically during sync part of snapshot. + */ + @SuppressWarnings("unchecked") + @Test + public void testPhysicallyRemoveDuringSyncPartOfSnapshot() throws IOException { + TypeSerializer<Integer> keySerializer = IntSerializer.INSTANCE; + TypeSerializer<Long> namespaceSerializer = LongSerializer.INSTANCE; + TypeSerializer<String> stateSerializer = StringSerializer.INSTANCE; + // set logicalRemovedKeysRatio to 0 so that all logically removed states will be deleted when snapshot + CopyOnWriteSkipListStateMap<Integer, Long, String> stateMap = new CopyOnWriteSkipListStateMap<>( + keySerializer, + namespaceSerializer, + stateSerializer, + spaceAllocator, + 0, + 0.0f); + + // map to store expected states, namespace -> key -> state + Map<Long, Map<Integer, String>> referenceStates = new HashMap<>(); + int totalStateSize = 0; + int totalSizeIncludingLogicallyRemovedStates = 0; + + // put some states + for (int i = 1; i <= 100; i++) { + totalStateSize++; + totalSizeIncludingLogicallyRemovedStates++; + stateMap.put(i, (long) i, String.valueOf(i)); + addToReferenceState(referenceStates, i, (long) i, String.valueOf(i)); + } + verifyState(referenceStates, stateMap); + + assertEquals(totalStateSize * 2, spaceAllocator.getTotalSpaceNumber()); + + Map<Long, Map<Integer, String>> expectedSnapshot1 = snapshotReferenceStates(referenceStates); + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot1 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String>) stateMap.stateSnapshot(); + + // remove all states logically + for (int i = 1; i <= 100; i++) { + totalStateSize--; + stateMap.remove(i, (long) i); + removeFromReferenceState(referenceStates, i, (long) i); + } + assertEquals(totalSizeIncludingLogicallyRemovedStates * 3, spaceAllocator.getTotalSpaceNumber()); + assertEquals(0, totalStateSize); + 
assertEquals(totalStateSize, stateMap.size()); + assertEquals(totalSizeIncludingLogicallyRemovedStates, stateMap.totalSize()); + assertEquals(totalSizeIncludingLogicallyRemovedStates, stateMap.getLogicallyRemovedNodes().size()); + verifyState(referenceStates, stateMap); + + verifySnapshotWithoutTransform( + expectedSnapshot1, snapshot1, keySerializer, namespaceSerializer, stateSerializer); + snapshot1.release(); + + // no spaces should be free + assertEquals(totalSizeIncludingLogicallyRemovedStates * 3, spaceAllocator.getTotalSpaceNumber()); + verifyState(referenceStates, stateMap); + + Map<Long, Map<Integer, String>> expectedSnapshot2 = snapshotReferenceStates(referenceStates); + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot2 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String>) stateMap.stateSnapshot(); + + // all state should be removed physically + totalSizeIncludingLogicallyRemovedStates = 0; + assertEquals(totalStateSize, stateMap.totalSize()); + assertEquals(totalSizeIncludingLogicallyRemovedStates, stateMap.totalSize()); + assertEquals(totalSizeIncludingLogicallyRemovedStates, stateMap.getLogicallyRemovedNodes().size()); + assertEquals(0, spaceAllocator.getTotalSpaceNumber()); + + verifySnapshotWithoutTransform( + expectedSnapshot2, snapshot2, keySerializer, namespaceSerializer, stateSerializer); + snapshot2.release(); + + assertEquals(0, stateMap.size()); + assertEquals(0, stateMap.totalSize()); + assertEquals(0, spaceAllocator.getTotalSpaceNumber()); + assertFalse(stateMap.iterator().hasNext()); + + stateMap.close(); + } + + /** + * Tests that snapshots prune useless values. 
+ */ + @SuppressWarnings("unchecked") + @Test + public void testSnapshotPruneValues() throws IOException { + TypeSerializer<Integer> keySerializer = IntSerializer.INSTANCE; + TypeSerializer<Long> namespaceSerializer = LongSerializer.INSTANCE; + TypeSerializer<String> stateSerializer = StringSerializer.INSTANCE; + // set logicalRemovedKeysRatio to 0 so that all logically removed states will be deleted when snapshot + CopyOnWriteSkipListStateMap<Integer, Long, String> stateMap = new CopyOnWriteSkipListStateMap<>(keySerializer, + namespaceSerializer, + stateSerializer, + spaceAllocator); + + // firstly build value chain and snapshots as follows + // ------ ------ ------ ------ + // | v3 | -> | v2 | -> | v1 | -> | v0 | + // ------ ------ ------ ------ + // | | | | + // snapshot4 snapshot3 snapshot2 snapshot1 + // snapshot5 + // snapshot6 + + List<String> referenceValues = new ArrayList<>(); + + // build v0 + stateMap.put(1, 1L, "0"); + referenceValues.add(0, "0"); + // get the pointer to the node + long node = stateMap.getLevelIndexHeader().getNextNode(0); + + // take snapshot1 + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot1 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String>) stateMap.stateSnapshot(); + + // build v1 + stateMap.put(1, 1L, "1"); + referenceValues.add(0, "1"); + + // take snapshot2 + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot2 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String>) stateMap.stateSnapshot(); + + // build v2 + stateMap.put(1, 1L, "2"); + referenceValues.add(0, "2"); + + // take snapshot3 + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot3 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String>) stateMap.stateSnapshot(); + + // build v3 + stateMap.put(1, 1L, "3"); + referenceValues.add(0, "3"); + + // take snapshot4 + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot4 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, 
String>) stateMap.stateSnapshot(); + + // take snapshot5 + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot5 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String>) stateMap.stateSnapshot(); + + // take snapshot6 + CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String> snapshot6 = + (CopyOnWriteSkipListStateMapSnapshot<Integer, Long, String>) stateMap.stateSnapshot(); + + assertEquals(6, stateMap.getStateMapVersion()); + assertEquals(6, stateMap.getHighestRequiredSnapshotVersion()); + assertEquals(6, stateMap.getSnapshotVersions().size()); + assertEquals(5, spaceAllocator.getTotalSpaceNumber()); + assertEquals(referenceValues, getAllValuesOfNode(stateMap, spaceAllocator, node)); + + Map<Long, Map<Integer, String>> referenceStates = new HashMap<>(); + referenceStates.put(1L, new HashMap<>()); + referenceStates.get(1L).put(1, "0"); + + // complete snapshot 1, and no value will be removed + verifySnapshotWithoutTransform( + referenceStates, snapshot1, keySerializer, namespaceSerializer, stateSerializer); + snapshot1.release(); + assertEquals(referenceValues, getAllValuesOfNode(stateMap, spaceAllocator, node)); + assertEquals(5, spaceAllocator.getTotalSpaceNumber()); + assertEquals(1, stateMap.getHighestFinishedSnapshotVersion()); + + // complete snapshot 3, and v0 will be removed + referenceStates.get(1L).put(1, "2"); + verifySnapshotWithoutTransform( + referenceStates, snapshot3, keySerializer, namespaceSerializer, stateSerializer); + snapshot3.release(); + referenceValues.remove(referenceValues.size() - 1); + assertEquals(referenceValues, getAllValuesOfNode(stateMap, spaceAllocator, node)); + assertEquals(4, spaceAllocator.getTotalSpaceNumber()); + assertEquals(1, stateMap.getHighestFinishedSnapshotVersion()); + + // complete snapshot 2, and no value will be removed + referenceStates.get(1L).put(1, "1"); + verifySnapshotWithoutTransform( + referenceStates, snapshot2, keySerializer, namespaceSerializer, stateSerializer); + 
snapshot2.release(); + assertEquals(referenceValues, getAllValuesOfNode(stateMap, spaceAllocator, node)); + assertEquals(4, spaceAllocator.getTotalSpaceNumber()); + assertEquals(3, stateMap.getHighestFinishedSnapshotVersion()); + + // add node to pruning set to prevent snapshot4 to prune + stateMap.getPruningValueNodes().add(node); Review comment: Yes, pruning out-of-date versions of a value that no snapshot references is internal processing, and we'd like to ensure the correctness of that logic in this test case. ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: us...@infra.apache.org With regards, Apache Git Services