Taewoo Kim created ASTERIXDB-2487:
-------------------------------------

             Summary: Cluster becomes UNUSUABLE with 
"java.lang.IllegalStateException: Couldn't find any checkpoints for resource"
                 Key: ASTERIXDB-2487
                 URL: https://issues.apache.org/jira/browse/ASTERIXDB-2487
             Project: Apache AsterixDB
          Issue Type: Bug
            Reporter: Taewoo Kim
         Attachments: nc-1.log

The Clouberry cluster became UNUSUABLE after the nc-1 (among five NCs) 
generated the following exception.

 
{code:java}
21:32:10.660 [Executor-10173:1] ERROR 
org.apache.hyracks.storage.am.lsm.common.impls.LSMHarness - FLUSH 
operation.afterFinalize failed on {"class" : "LSMBTree", "dir" : 
"/home/waans11/asterixdb/io1/storage/partition_0/twitter/ds_tweet_e9ad9c2394f7dc7b6a69fb43e52a7382/0/ds_tweet_e9ad9c2394f7dc7b6a69fb43e52a7382",
 "memory" : [{"class":"LSMBTreeMemoryComponent", 
"state":"READABLE_UNWRITABLE_FLUSHING", "writers":0, "readers":1, 
"pendingFlushes":0, "id":"[9,9]"}, {"class":"LSMBTreeMemoryComponent", 
"state":"INACTIVE", "writers":0, "readers":0, "pendingFlushes":0, 
"id":"[8,8]"}], "disk" : 3, "num-scheduled-flushes":1, 
"current-memory-component":1}
java.lang.IllegalStateException: Couldn't find any checkpoints for resource: 
io1/storage/partition_0/twitter/ds_tweet_e9ad9c2394f7dc7b6a69fb43e52a7382/0/ds_tweet_e9ad9c2394f7dc7b6a69fb43e52a7382
at 
org.apache.asterix.app.nc.IndexCheckpointManager.getLatest(IndexCheckpointManager.java:145)
 ~[asterix-app-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.asterix.app.nc.IndexCheckpointManager.flushed(IndexCheckpointManager.java:86)
 ~[asterix-app-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.asterix.common.ioopcallbacks.LSMIOOperationCallback.addComponentToCheckpoint(LSMIOOperationCallback.java:136)
 ~[asterix-common-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.asterix.common.ioopcallbacks.LSMIOOperationCallback.afterFinalize(LSMIOOperationCallback.java:123)
 ~[asterix-common-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.LSMHarness.doIo(LSMHarness.java:544)
 [hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.LSMHarness.flush(LSMHarness.java:513)
 [hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.LSMTreeIndexAccessor.flush(LSMTreeIndexAccessor.java:122)
 [hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.FlushOperation.call(FlushOperation.java:38)
 [hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.FlushOperation.call(FlushOperation.java:29)
 [hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at java.util.concurrent.FutureTask.run(FutureTask.java:266) [?:1.8.0_161]
at 
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) 
[?:1.8.0_161]
at 
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) 
[?:1.8.0_161]
at java.lang.Thread.run(Thread.java:748) [?:1.8.0_161]
21:32:10.663 [Executor-10172:1] ERROR 
org.apache.hyracks.storage.am.lsm.common.impls.LSMHarness - FLUSH 
operation.afterFinalize failed on {"class" : "LSMBTree", "dir" : 
"/home/waans11/asterixdb/io2/storage/partition_1/twitter/ds_tweet_9460370bb0ca1c98a779b1bcc6861c2c/0/ds_tweet_9460370bb0ca1c98a779b1bcc6861c2c",
 "memory" : [{"class":"LSMBTreeMemoryComponent", 
"state":"READABLE_UNWRITABLE_FLUSHING", "writers":0, "readers":1, 
"pendingFlushes":0, "id":"[24,24]"}, {"class":"LSMBTreeMemoryComponent", 
"state":"INACTIVE", "writers":0, "readers":0, "pendingFlushes":0, 
"id":"[23,23]"}], "disk" : 4, "num-scheduled-flushes":1, 
"current-memory-component":1}
java.lang.IllegalStateException: Couldn't find any checkpoints for resource: 
io2/storage/partition_1/twitter/ds_tweet_9460370bb0ca1c98a779b1bcc6861c2c/0/ds_tweet_9460370bb0ca1c98a779b1bcc6861c2c
at 
org.apache.asterix.app.nc.IndexCheckpointManager.getLatest(IndexCheckpointManager.java:145)
 ~[asterix-app-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.asterix.app.nc.IndexCheckpointManager.flushed(IndexCheckpointManager.java:86)
 ~[asterix-app-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.asterix.common.ioopcallbacks.LSMIOOperationCallback.addComponentToCheckpoint(LSMIOOperationCallback.java:136)
 ~[asterix-common-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.asterix.common.ioopcallbacks.LSMIOOperationCallback.afterFinalize(LSMIOOperationCallback.java:123)
 ~[asterix-common-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.asterix.common.ioopcallbacks.LSMIOOperationCallback.addComponentToCheckpoint(LSMIOOperationCallback.java:136)
 ~[asterix-common-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.asterix.common.ioopcallbacks.LSMIOOperationCallback.afterFinalize(LSMIOOperationCallback.java:123)
 ~[asterix-common-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.LSMHarness.doIo(LSMHarness.java:544)
 [hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.LSMHarness.flush(LSMHarness.java:513)
 [hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.LSMTreeIndexAccessor.flush(LSMTreeIndexAccessor.java:122)
 [hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.FlushOperation.call(FlushOperation.java:38)
 [hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.FlushOperation.call(FlushOperation.java:29)
 [hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at java.util.concurrent.FutureTask.run(FutureTask.java:266) [?:1.8.0_161]
at 
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) 
[?:1.8.0_161]
at 
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) 
[?:1.8.0_161]
at java.lang.Thread.run(Thread.java:748) [?:1.8.0_161]
21:32:10.690 [Executor-10172:1] ERROR org.apache.asterix.app.nc.HaltCallback - 
Operation 
org.apache.hyracks.storage.am.lsm.btree.impls.LSMBTreeFlushOperation@b305d582 
has failed
java.lang.IllegalStateException: Couldn't find any checkpoints for resource: 
io2/storage/partition_1/twitter/ds_tweet_9460370bb0ca1c98a779b1bcc6861c2c/0/ds_tweet_9460370bb0ca1c98a779b1bcc6861c2c
at 
org.apache.asterix.app.nc.IndexCheckpointManager.getLatest(IndexCheckpointManager.java:145)
 ~[asterix-app-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.asterix.app.nc.IndexCheckpointManager.flushed(IndexCheckpointManager.java:86)
 ~[asterix-app-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.asterix.common.ioopcallbacks.LSMIOOperationCallback.addComponentToCheckpoint(LSMIOOperationCallback.java:136)
 ~[asterix-common-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.asterix.common.ioopcallbacks.LSMIOOperationCallback.afterFinalize(LSMIOOperationCallback.java:123)
 ~[asterix-common-0.9.5-SNAPSHOT.jar:0.9.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.LSMHarness.doIo(LSMHarness.java:544)
 ~[hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.LSMHarness.flush(LSMHarness.java:513)
 ~[hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.LSMTreeIndexAccessor.flush(LSMTreeIndexAccessor.java:122)
 ~[hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.FlushOperation.call(FlushOperation.java:38)
 ~[hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at 
org.apache.hyracks.storage.am.lsm.common.impls.FlushOperation.call(FlushOperation.java:29)
 ~[hyracks-storage-am-lsm-common-0.3.5-SNAPSHOT.jar:0.3.5-SNAPSHOT]
at java.util.concurrent.FutureTask.run(FutureTask.java:266) ~[?:1.8.0_161]
at 
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) 
[?:1.8.0_161]
at 
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) 
[?:1.8.0_161]
at java.lang.Thread.run(Thread.java:748) [?:1.8.0_161]{code}



--
This message was sent by Atlassian JIRA
(v7.6.3#76005)

Reply via email to