You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@hbase.apache.org by te...@apache.org on 2011/12/31 16:43:19 UTC
svn commit: r1226110 - in /hbase/trunk: CHANGES.txt
src/main/java/org/apache/hadoop/hbase/master/AssignmentManager.java
Author: tedyu
Date: Sat Dec 31 15:43:19 2011
New Revision: 1226110
URL: http://svn.apache.org/viewvc?rev=1226110&view=rev
Log:
HBASE-4397 -ROOT-, .META. tables stay offline for too long in recovery phase after all RSs
are shutdown at the same time (Ming Ma)
Modified:
hbase/trunk/CHANGES.txt
hbase/trunk/src/main/java/org/apache/hadoop/hbase/master/AssignmentManager.java
Modified: hbase/trunk/CHANGES.txt
URL: http://svn.apache.org/viewvc/hbase/trunk/CHANGES.txt?rev=1226110&r1=1226109&r2=1226110&view=diff
==============================================================================
--- hbase/trunk/CHANGES.txt (original)
+++ hbase/trunk/CHANGES.txt Sat Dec 31 15:43:19 2011
@@ -466,6 +466,8 @@ Release 0.92.0 - Unreleased
HBASE-5099 ZK event thread waiting for root region assignment may block server
shutdown handler for the region sever the root region was on (Jimmy)
HBASE-5100 Rollback of split could cause closed region to be opened again (Chunhui)
+ HBASE-4397 -ROOT-, .META. tables stay offline for too long in recovery phase after all RSs
+ are shutdown at the same time (Ming Ma)
TESTS
HBASE-4450 test for number of blocks read: to serve as baseline for expected
Modified: hbase/trunk/src/main/java/org/apache/hadoop/hbase/master/AssignmentManager.java
URL: http://svn.apache.org/viewvc/hbase/trunk/src/main/java/org/apache/hadoop/hbase/master/AssignmentManager.java?rev=1226110&r1=1226109&r2=1226110&view=diff
==============================================================================
--- hbase/trunk/src/main/java/org/apache/hadoop/hbase/master/AssignmentManager.java (original)
+++ hbase/trunk/src/main/java/org/apache/hadoop/hbase/master/AssignmentManager.java Sat Dec 31 15:43:19 2011
@@ -191,7 +191,7 @@ public class AssignmentManager extends Z
Configuration conf = master.getConfiguration();
this.timeoutMonitor = new TimeoutMonitor(
conf.getInt("hbase.master.assignment.timeoutmonitor.period", 10000),
- master,
+ master, serverManager,
conf.getInt("hbase.master.assignment.timeoutmonitor.timeout", 1800000));
Threads.setDaemonThreadRunning(timeoutMonitor.getThread(),
master.getServerName() + ".timeoutMonitor");
@@ -1498,6 +1498,7 @@ public class AssignmentManager extends Z
state.update(RegionState.State.OFFLINE);
// Force a new plan and reassign. Will return null if no servers.
if (getRegionPlan(state, plan.getDestination(), true) == null) {
+ this.timeoutMonitor.setAllRegionServersOffline(true);
LOG.warn("Unable to find a viable location to assign region " +
state.getRegion().getRegionNameAsString());
return;
@@ -2512,6 +2513,8 @@ public class AssignmentManager extends Z
public class TimeoutMonitor extends Chore {
private final int timeout;
private boolean bulkAssign = false;
+ private boolean allRegionServersOffline = false;
+ private ServerManager serverManager;
/**
* Creates a periodic monitor to check for time outs on region transition
@@ -2523,9 +2526,11 @@ public class AssignmentManager extends Z
* @param timeout
*/
public TimeoutMonitor(final int period, final Stoppable stopper,
+ ServerManager serverManager,
final int timeout) {
super("AssignmentTimeoutMonitor", period, stopper);
this.timeout = timeout;
+ this.serverManager = serverManager;
}
/**
@@ -2539,10 +2544,18 @@ public class AssignmentManager extends Z
return result;
}
+ private synchronized void setAllRegionServersOffline(
+ boolean allRegionServersOffline) {
+ this.allRegionServersOffline = allRegionServersOffline;
+ }
+
@Override
protected void chore() {
// If bulkAssign in progress, suspend checks
if (this.bulkAssign) return;
+ boolean allRSsOffline = this.serverManager.getOnlineServersList().
+ isEmpty();
+
synchronized (regionsInTransition) {
// Iterate all regions in transition checking for time outs
long now = System.currentTimeMillis();
@@ -2550,9 +2563,14 @@ public class AssignmentManager extends Z
if (regionState.getStamp() + timeout <= now) {
//decide on action upon timeout
actOnTimeOut(regionState);
+ } else if (this.allRegionServersOffline && !allRSsOffline) {
+ // if some RSs just came back online, we can start the
+ // the assignment right away
+ actOnTimeOut(regionState);
}
}
}
+ setAllRegionServersOffline(allRSsOffline);
}
private void actOnTimeOut(RegionState regionState) {