From ae77f81e7eaf07e9943688f10f7f7e14211151c2 Mon Sep 17 00:00:00 2001 From: Bo Cui Date: Mon, 4 Jan 2021 23:34:38 +0800 Subject: [PATCH] HBASE-25447 remoteProc is suspended due to OOM ERROR (#2824) Some OOMEs do not cause the JVM to exit, such as "java.lang.OutOfMemoryError: Direct buffer memory" and "java.lang.OutOfMemoryError: unable to create new native thread", because they don't call vmError#next_OnError_command. So abort the HMaster when an uncaught exception occurs in TimeoutExecutor; the new active HMaster will resume the suspended procedure. Signed-off-by: Duo Zhang Signed-off-by: stack Signed-off-by: Pankaj Kumar (cherry picked from commit 600be60a4bd4d3b3e9652027a0cb8bdd32016c6b) --- .../hbase/procedure2/RemoteProcedureDispatcher.java | 4 ++++ .../hbase/master/procedure/RSProcedureDispatcher.java | 8 ++++++++ 2 files changed, 12 insertions(+) diff --git a/hbase-procedure/src/main/java/org/apache/hadoop/hbase/procedure2/RemoteProcedureDispatcher.java b/hbase-procedure/src/main/java/org/apache/hadoop/hbase/procedure2/RemoteProcedureDispatcher.java index 71d55ea9afb..8a5a19ea2db 100644 --- a/hbase-procedure/src/main/java/org/apache/hadoop/hbase/procedure2/RemoteProcedureDispatcher.java +++ b/hbase-procedure/src/main/java/org/apache/hadoop/hbase/procedure2/RemoteProcedureDispatcher.java @@ -106,6 +106,10 @@ public abstract class RemoteProcedureDispatcher