From ff122f80b9b85176adb616306938f64fa62e963f Mon Sep 17 00:00:00 2001 From: stack Date: Thu, 9 Jul 2015 16:46:17 -0700 Subject: [PATCH] HBASE-14053 Disable DLR in branch-1+ --- .../org/apache/hadoop/hbase/HConstants.java | 5 +- .../src/main/resources/hbase-default.xml | 51 ++++++++----------- src/main/asciidoc/_chapters/architecture.adoc | 11 +--- 3 files changed, 22 insertions(+), 45 deletions(-) diff --git a/hbase-common/src/main/java/org/apache/hadoop/hbase/HConstants.java b/hbase-common/src/main/java/org/apache/hadoop/hbase/HConstants.java index 32f07cbedc1..704b90fd2bb 100644 --- a/hbase-common/src/main/java/org/apache/hadoop/hbase/HConstants.java +++ b/hbase-common/src/main/java/org/apache/hadoop/hbase/HConstants.java @@ -892,10 +892,7 @@ public final class HConstants { /** Conf key that enables unflushed WAL edits directly being replayed to region servers */ public static final String DISTRIBUTED_LOG_REPLAY_KEY = "hbase.master.distributed.log.replay"; - /** - * Default 'distributed log replay' as true since hbase 0.99.0 - */ - public static final boolean DEFAULT_DISTRIBUTED_LOG_REPLAY_CONFIG = true; + public static final boolean DEFAULT_DISTRIBUTED_LOG_REPLAY_CONFIG = false; public static final String DISALLOW_WRITES_IN_RECOVERING = "hbase.regionserver.disallow.writes.when.recovering"; public static final boolean DEFAULT_DISALLOW_WRITES_IN_RECOVERING_CONFIG = false; diff --git a/hbase-common/src/main/resources/hbase-default.xml b/hbase-common/src/main/resources/hbase-default.xml index 5d5bb1093b4..1ad15bb3837 100644 --- a/hbase-common/src/main/resources/hbase-default.xml +++ b/hbase-common/src/main/resources/hbase-default.xml @@ -283,17 +283,6 @@ possible configurations would overwhelm and obscure the important. org.apache.hadoop.hbase.regionserver.wal.ProtobufLogWriter The WAL file writer implementation. - - hbase.master.distributed.log.replay - true - Enable 'distributed log replay' as default engine splitting - WAL files on server crash. This default is new in hbase 1.0. To fall - back to the old mode 'distributed log splitter', set the value to - 'false'. 'Disributed log replay' improves MTTR because it does not - write intermediate files. 'DLR' required that 'hfile.format.version' - be set to version 3 or higher. - - hbase.regionserver.global.memstore.size @@ -309,7 +298,7 @@ possible configurations would overwhelm and obscure the important. Maximum size of all memstores in a region server before flushes are forced. Defaults to 95% of hbase.regionserver.global.memstore.size (0.95). - A 100% value for this value causes the minimum possible flushing to occur when updates are + A 100% value for this value causes the minimum possible flushing to occur when updates are blocked due to memstore limiting. The default value in this configuration has been intentionally left emtpy in order to honor the old hbase.regionserver.global.memstore.lowerLimit property if present. @@ -793,9 +782,9 @@ possible configurations would overwhelm and obscure the important. hbase.hstore.time.to.purge.deletes 0 - The amount of time to delay purging of delete markers with future timestamps. If - unset, or set to 0, all delete markers, including those with future timestamps, are purged - during the next major compaction. Otherwise, a delete marker is kept until the major compaction + The amount of time to delay purging of delete markers with future timestamps. If + unset, or set to 0, all delete markers, including those with future timestamps, are purged + during the next major compaction. Otherwise, a delete marker is kept until the major compaction which occurs after the marker's timestamp plus the value of this setting, in milliseconds. @@ -896,7 +885,7 @@ possible configurations would overwhelm and obscure the important. The HFile format version to use for new files. Version 3 adds support for tags in hfiles (See http://hbase.apache.org/book.html#hbase.tags). Distributed Log Replay requires that tags are enabled. Also see the configuration - 'hbase.replication.rpc.codec'. + 'hbase.replication.rpc.codec'. @@ -1313,7 +1302,7 @@ possible configurations would overwhelm and obscure the important. fails, we will switch back to using HDFS checksums (so do not disable HDFS checksums! And besides this feature applies to hfiles only, not to WALs). If this parameter is set to false, then hbase will not verify any checksums, - instead it will depend on checksum verification being done in the HDFS client. + instead it will depend on checksum verification being done in the HDFS client. @@ -1456,11 +1445,11 @@ possible configurations would overwhelm and obscure the important. hbase.procedure.regionserver.classes - A comma-separated list of - org.apache.hadoop.hbase.procedure.RegionServerProcedureManager procedure managers that are - loaded by default on the active HRegionServer process. The lifecycle methods (init/start/stop) - will be called by the active HRegionServer process to perform the specific globally barriered - procedure. After implementing your own RegionServerProcedureManager, just put it in + A comma-separated list of + org.apache.hadoop.hbase.procedure.RegionServerProcedureManager procedure managers that are + loaded by default on the active HRegionServer process. The lifecycle methods (init/start/stop) + will be called by the active HRegionServer process to perform the specific globally barriered + procedure. After implementing your own RegionServerProcedureManager, just put it in HBase's classpath and add the fully qualified class name here. @@ -1501,8 +1490,8 @@ possible configurations would overwhelm and obscure the important. which will tail the logs and replicate the mutatations to region replicas for tables that have region replication > 1. If this is enabled once, disabling this replication also requires disabling the replication peer using shell or ReplicationAdmin java class. - Replication to secondary region replicas works over standard inter-cluster replication. - So replication, if disabled explicitly, also has to be enabled by setting "hbase.replication" + Replication to secondary region replicas works over standard inter-cluster replication. + So replication, if disabled explicitly, also has to be enabled by setting "hbase.replication" to true for this feature to work. @@ -1510,12 +1499,12 @@ possible configurations would overwhelm and obscure the important. hbase.http.filter.initializers org.apache.hadoop.hbase.http.lib.StaticUserWebFilter - A comma separated list of class names. Each class in the list must extend - org.apache.hadoop.hbase.http.FilterInitializer. The corresponding Filter will - be initialized. Then, the Filter will be applied to all user facing jsp - and servlet web pages. + A comma separated list of class names. Each class in the list must extend + org.apache.hadoop.hbase.http.FilterInitializer. The corresponding Filter will + be initialized. Then, the Filter will be applied to all user facing jsp + and servlet web pages. The ordering of the list defines the ordering of the filters. - The default StaticUserWebFilter add a user principal as defined by the + The default StaticUserWebFilter add a user principal as defined by the hbase.http.staticuser.user property. @@ -1531,7 +1520,7 @@ possible configurations would overwhelm and obscure the important. hbase.http.max.threads 10 - The maximum number of threads that the HTTP Server will create in its + The maximum number of threads that the HTTP Server will create in its ThreadPool. @@ -1540,7 +1529,7 @@ possible configurations would overwhelm and obscure the important. org.apache.hadoop.hbase.codec.KeyValueCodecWithTags The codec that is to be used when replication is enabled so that - the tags are also replicated. This is used along with HFileV3 which + the tags are also replicated. This is used along with HFileV3 which supports tags in them. If tags are not used or if the hfile version used is HFileV2 then KeyValueCodec can be used as the replication codec. Note that using KeyValueCodecWithTags for replication when there are no tags causes no harm. diff --git a/src/main/asciidoc/_chapters/architecture.adoc b/src/main/asciidoc/_chapters/architecture.adoc index bee1c16b21a..740b5851a24 100644 --- a/src/main/asciidoc/_chapters/architecture.adoc +++ b/src/main/asciidoc/_chapters/architecture.adoc @@ -1016,16 +1016,7 @@ For background, see link:https://issues.apache.org/jira/browse/HBASE-2643[HBASE- ===== Performance Improvements during Log Splitting -WAL log splitting and recovery can be resource intensive and take a long time, depending on the number of RegionServers involved in the crash and the size of the regions. <> and <> were developed to improve performance during log splitting. - -[[distributed.log.splitting]] -====== Distributed Log Splitting - -_Distributed Log Splitting_ was added in HBase version 0.92 (link:https://issues.apache.org/jira/browse/HBASE-1364[HBASE-1364]) by Prakash Khemani from Facebook. -It reduces the time to complete log splitting dramatically, improving the availability of regions and tables. -For example, recovering a crashed cluster took around 9 hours with single-threaded log splitting, but only about six minutes with distributed log splitting. - -The information in this section is sourced from Jimmy Xiang's blog post at http://blog.cloudera.com/blog/2012/07/hbase-log-splitting/. +WAL log splitting and recovery can be resource intensive and take a long time, depending on the number of RegionServers involved in the crash and the size of the regions. <> was developed to improve performance during log splitting. .Enabling or Disabling Distributed Log Splitting