Note: Please use Issues only for bug reports. For questions, discussions, feature requests, etc. post to dev group: https://groups.google.com/forum/#!forum/rocksdb or https://www.facebook.com/groups/rocksdb.dev
Expected behavior
RocksDB continues to serve reads and writes.
Actual behavior
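RocksDB crashes the JVM with a SIGSEGV (SEGV_MAPERR at address 0x50) inside `rocksdb::LegacyFileSystemWrapper::NewSequentialFile`, reached from the Java call `RocksDB.listColumnFamilies`.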
Steps to reproduce the behavior
For now I can only provide the backtrace from the crash dump (below). Please let me know what other information is needed.
Host: Intel(R) Xeon(R) Silver 4110 CPU @ 2.10GHz, 32 cores, 376G, Red Hat Enterprise Linux Server release 7.8 (Maipo)
Time: Mon Aug 2 17:21:25 2021 PDT elapsed time: 480.081057 seconds (0d 0h 8m 0s)
--------------- T H R E A D ---------------
Current thread (0x00007f0e02e36800): JavaThread "grpc-default-executor-24" daemon [_thread_in_native, id=48415, stack(0x00007f0defb58000,0x00007f0defc59000)]
Stack: [0x00007f0defb58000,0x00007f0defc59000], sp=0x00007f0defc56bc0, free space=1018k
Native frames: (J=compiled Java code, A=aot compiled Java code, j=interpreted, Vv=VM code, C=native code)
C [librocksdbjni15379259497632127760.so+0x29bb93] rocksdb::LegacyFileSystemWrapper::NewSequentialFile(std::string const&, rocksdb::FileOptions const&, std::unique_ptr<rocksdb::FSSequentialFile, std::default_delete<rocksdb::FSSequentialFile> >*, rocksdb::IODebugContext*)+0x33
C [librocksdbjni15379259497632127760.so+0x3d2df0] rocksdb::ReadFileToString(rocksdb::FileSystem*, std::string const&, std::string*)+0x90
C [librocksdbjni15379259497632127760.so+0x37fc0b] rocksdb::VersionSet::GetCurrentManifestPath(std::string const&, rocksdb::FileSystem*, std::string*, unsigned long*)+0x5b
C [librocksdbjni15379259497632127760.so+0x397b24] rocksdb::VersionSet::ListColumnFamilies(std::vector<std::string, std::allocator<std::string> >*, std::string const&, rocksdb::FileSystem*)+0x64
C [librocksdbjni15379259497632127760.so+0x27e7eb] rocksdb::DB::ListColumnFamilies(rocksdb::DBOptions const&, std::string const&, std::vector<std::string, std::allocator<std::string> >*)+0x5b
C [librocksdbjni15379259497632127760.so+0x1dfda9] Java_org_rocksdb_RocksDB_listColumnFamilies+0x89
J 4117 org.rocksdb.RocksDB.listColumnFamilies(JLjava/lang/String;)[[B (0 bytes) @ 0x00007f0e38785fa2 [0x00007f0e38785ec0+0x00000000000000e2]
J 16357 c2 org.apache.hadoop.hdds.utils.db.RDBStore.<init>(Ljava/io/File;Lorg/rocksdb/DBOptions;Lorg/rocksdb/WriteOptions;Ljava/util/Set;Lorg/apache/hadoop/hdds/utils/db/CodecRegistry;Z)V (717 bytes) @ 0x00007f0e3938e460 [0x00007f0e3938d9e0+0x0000000000000a80]
J 14139 c2 org.apache.hadoop.ozone.container.metadata.DatanodeStoreSchemaOneImpl.<init>(Lorg/apache/hadoop/hdds/conf/ConfigurationSource;JLjava/lang/String;Z)V (18 bytes) @ 0x00007f0e3906a668 [0x00007f0e39066b00+0x0000000000003b68]
J 15249 c2 org.apache.hadoop.ozone.container.common.utils.ContainerCache.getDB(JLjava/lang/String;Ljava/lang/String;Ljava/lang/String;Lorg/apache/hadoop/hdds/conf/ConfigurationSource;)Lorg/apache/hadoop/ozone/container/common/utils/ReferenceCountedDB; (339 bytes) @ 0x00007f0e391e30d0 [0x00007f0e391e2ac0+0x0000000000000610]
J 18254 c2 org.apache.hadoop.ozone.container.keyvalue.impl.BlockManagerImpl.getBlock(Lorg/apache/hadoop/ozone/container/common/interfaces/Container;Lorg/apache/hadoop/hdds/client/BlockID;)Lorg/apache/hadoop/ozone/container/common/helpers/BlockData; (299 bytes) @ 0x00007f0e38f40858 [0x00007f0e38f406e0+0x0000000000000178]
J 17900 c2 org.apache.hadoop.ozone.container.keyvalue.KeyValueHandler.handle(Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandRequestProto;Lorg/apache/hadoop/ozone/container/common/interfaces/Container;Lorg/apache/hadoop/ozone/container/common/transport/server/ratis/DispatcherContext;)Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandResponseProto; (11 bytes) @ 0x00007f0e3966b42c [0x00007f0e39668340+0x00000000000030ec]
J 17904 c2 org.apache.hadoop.ozone.container.common.impl.HddsDispatcher.dispatchRequest(Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandRequestProto;Lorg/apache/hadoop/ozone/container/common/transport/server/ratis/DispatcherContext;)Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandResponseProto; (1105 bytes) @ 0x00007f0e39658378 [0x00007f0e39656ba0+0x00000000000017d8]
J 8487 c2 org.apache.hadoop.hdds.server.OzoneProtocolMessageDispatcher.processRequest(Ljava/lang/Object;Lorg/apache/hadoop/hdds/function/FunctionWithServiceException;Ljava/lang/Object;Ljava/lang/String;)Ljava/lang/Object; (205 bytes) @ 0x00007f0e38c0e908 [0x00007f0e38c0e6e0+0x0000000000000228]
J 12956 c2 org.apache.hadoop.ozone.container.common.impl.HddsDispatcher.dispatch(Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandRequestProto;Lorg/apache/hadoop/ozone/container/common/transport/server/ratis/DispatcherContext;)Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandResponseProto; (38 bytes) @ 0x00007f0e38dd88d0 [0x00007f0e38dd8740+0x0000000000000190]
J 17877 c2 org.apache.hadoop.ozone.container.common.transport.server.GrpcXceiverService$1.onNext(Ljava/lang/Object;)V (9 bytes) @ 0x00007f0e3962efd8 [0x00007f0e3962ef60+0x0000000000000078]
J 17878 c2 org.apache.hadoop.hdds.tracing.GrpcServerInterceptor$1.onMessage(Ljava/lang/Object;)V (155 bytes) @ 0x00007f0e39631718 [0x00007f0e39631380+0x0000000000000398]
J 17572 c2 org.apache.ratis.thirdparty.io.grpc.internal.ServerImpl$JumpToApplicationThreadServerStreamListener$1MessagesAvailable.runInContext()V (77 bytes) @ 0x00007f0e3923dc40 [0x00007f0e3923d8c0+0x0000000000000380]
J 14423 c2 org.apache.ratis.thirdparty.io.grpc.internal.ContextRunnable.run()V (35 bytes) @ 0x00007f0e3889bf28 [0x00007f0e3889be80+0x00000000000000a8]
J 14467 c2 org.apache.ratis.thirdparty.io.grpc.internal.SerializingExecutor.run()V (99 bytes) @ 0x00007f0e38bbb27c [0x00007f0e38bbb180+0x00000000000000fc]
J 15549 c2 java.util.concurrent.ThreadPoolExecutor.runWorker(Ljava/util/concurrent/ThreadPoolExecutor$Worker;)V [email protected] (187 bytes) @ 0x00007f0e39278620 [0x00007f0e39278460+0x00000000000001c0]
J 6773 c1 java.util.concurrent.ThreadPoolExecutor$Worker.run()V [email protected] (9 bytes) @ 0x00007f0e31304be4 [0x00007f0e31304b40+0x00000000000000a4]
J 6760 c1 java.lang.Thread.run()V [email protected] (17 bytes) @ 0x00007f0e31303934 [0x00007f0e313037c0+0x0000000000000174]
v ~StubRoutines::call_stub
V [libjvm.so+0x88abd6] JavaCalls::call_helper(JavaValue*, methodHandle const&, JavaCallArguments*, Thread*)+0x366
V [libjvm.so+0x888bdd] JavaCalls::call_virtual(JavaValue*, Handle, Klass*, Symbol*, Symbol*, Thread*)+0x1ed
V [libjvm.so+0x935d0c] thread_entry(JavaThread*, Thread*)+0x6c
V [libjvm.so+0xe2c91a] JavaThread::thread_main_inner()+0x1fa
V [libjvm.so+0xe2933f] Thread::call_run()+0x14f
V [libjvm.so+0xc6fb9e] thread_native_entry(Thread*)+0xee
Java frames: (J=compiled Java code, j=interpreted, Vv=VM code)
J 4117 org.rocksdb.RocksDB.listColumnFamilies(JLjava/lang/String;)[[B (0 bytes) @ 0x00007f0e38785f2d [0x00007f0e38785ec0+0x000000000000006d]
J 16357 c2 org.apache.hadoop.hdds.utils.db.RDBStore.<init>(Ljava/io/File;Lorg/rocksdb/DBOptions;Lorg/rocksdb/WriteOptions;Ljava/util/Set;Lorg/apache/hadoop/hdds/utils/db/CodecRegistry;Z)V (717 bytes) @ 0x00007f0e3938e460 [0x00007f0e3938d9e0+0x0000000000000a80]
J 14139 c2 org.apache.hadoop.ozone.container.metadata.DatanodeStoreSchemaOneImpl.<init>(Lorg/apache/hadoop/hdds/conf/ConfigurationSource;JLjava/lang/String;Z)V (18 bytes) @ 0x00007f0e3906a668 [0x00007f0e39066b00+0x0000000000003b68]
J 15249 c2 org.apache.hadoop.ozone.container.common.utils.ContainerCache.getDB(JLjava/lang/String;Ljava/lang/String;Ljava/lang/String;Lorg/apache/hadoop/hdds/conf/ConfigurationSource;)Lorg/apache/hadoop/ozone/container/common/utils/ReferenceCountedDB; (339 bytes) @ 0x00007f0e391e30d0 [0x00007f0e391e2ac0+0x0000000000000610]
J 18254 c2 org.apache.hadoop.ozone.container.keyvalue.impl.BlockManagerImpl.getBlock(Lorg/apache/hadoop/ozone/container/common/interfaces/Container;Lorg/apache/hadoop/hdds/client/BlockID;)Lorg/apache/hadoop/ozone/container/common/helpers/BlockData; (299 bytes) @ 0x00007f0e38f40858 [0x00007f0e38f406e0+0x0000000000000178]
J 17900 c2 org.apache.hadoop.ozone.container.keyvalue.KeyValueHandler.handle(Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandRequestProto;Lorg/apache/hadoop/ozone/container/common/interfaces/Container;Lorg/apache/hadoop/ozone/container/common/transport/server/ratis/DispatcherContext;)Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandResponseProto; (11 bytes) @ 0x00007f0e3966b42c [0x00007f0e39668340+0x00000000000030ec]
J 17904 c2 org.apache.hadoop.ozone.container.common.impl.HddsDispatcher.dispatchRequest(Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandRequestProto;Lorg/apache/hadoop/ozone/container/common/transport/server/ratis/DispatcherContext;)Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandResponseProto; (1105 bytes) @ 0x00007f0e39658378 [0x00007f0e39656ba0+0x00000000000017d8]
J 8487 c2 org.apache.hadoop.hdds.server.OzoneProtocolMessageDispatcher.processRequest(Ljava/lang/Object;Lorg/apache/hadoop/hdds/function/FunctionWithServiceException;Ljava/lang/Object;Ljava/lang/String;)Ljava/lang/Object; (205 bytes) @ 0x00007f0e38c0e908 [0x00007f0e38c0e6e0+0x0000000000000228]
J 12956 c2 org.apache.hadoop.ozone.container.common.impl.HddsDispatcher.dispatch(Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandRequestProto;Lorg/apache/hadoop/ozone/container/common/transport/server/ratis/DispatcherContext;)Lorg/apache/hadoop/hdds/protocol/datanode/proto/ContainerProtos$ContainerCommandResponseProto; (38 bytes) @ 0x00007f0e38dd88d0 [0x00007f0e38dd8740+0x0000000000000190]
J 17877 c2 org.apache.hadoop.ozone.container.common.transport.server.GrpcXceiverService$1.onNext(Ljava/lang/Object;)V (9 bytes) @ 0x00007f0e3962efd8 [0x00007f0e3962ef60+0x0000000000000078]
J 17878 c2 org.apache.hadoop.hdds.tracing.GrpcServerInterceptor$1.onMessage(Ljava/lang/Object;)V (155 bytes) @ 0x00007f0e39631718 [0x00007f0e39631380+0x0000000000000398]
J 17572 c2 org.apache.ratis.thirdparty.io.grpc.internal.ServerImpl$JumpToApplicationThreadServerStreamListener$1MessagesAvailable.runInContext()V (77 bytes) @ 0x00007f0e3923dc40 [0x00007f0e3923d8c0+0x0000000000000380]
J 14423 c2 org.apache.ratis.thirdparty.io.grpc.internal.ContextRunnable.run()V (35 bytes) @ 0x00007f0e3889bf28 [0x00007f0e3889be80+0x00000000000000a8]
J 14467 c2 org.apache.ratis.thirdparty.io.grpc.internal.SerializingExecutor.run()V (99 bytes) @ 0x00007f0e38bbb27c [0x00007f0e38bbb180+0x00000000000000fc]
J 15549 c2 java.util.concurrent.ThreadPoolExecutor.runWorker(Ljava/util/concurrent/ThreadPoolExecutor$Worker;)V [email protected] (187 bytes) @ 0x00007f0e39278620 [0x00007f0e39278460+0x00000000000001c0]
J 6773 c1 java.util.concurrent.ThreadPoolExecutor$Worker.run()V [email protected] (9 bytes) @ 0x00007f0e31304be4 [0x00007f0e31304b40+0x00000000000000a4]
J 6760 c1 java.lang.Thread.run()V [email protected] (17 bytes) @ 0x00007f0e31303934 [0x00007f0e313037c0+0x0000000000000174]
v ~StubRoutines::call_stub
siginfo: si_signo: 11 (SIGSEGV), si_code: 1 (SEGV_MAPERR), si_addr: 0x0000000000000050
[hs_err_pid70046.log](https://github.com/facebook/rocksdb/files/6926076/hs_err_pid70046.log)
java-api