diff --git a/src/main/docbkx/book.xml b/src/main/docbkx/book.xml index b0273b2be1e..70e44811c3d 100644 --- a/src/main/docbkx/book.xml +++ b/src/main/docbkx/book.xml @@ -34,7 +34,7 @@ - + @@ -104,8 +104,7 @@ column contents:html is made up of the column family contents and html qualifier. - The colon character (:) delimits the column family from the + The colon character (:) delimits the column family from the column family qualifier. @@ -189,53 +188,58 @@ A namespace is a logical grouping of tables analogous to a database in relation database systems. This abstraction lays the groundwork for upcoming multi-tenancy related features: - Quota Management (HBASE-8410) - Restrict the amount of resources (ie - regions, tables) a namespace can consume. - Namespace Security Administration (HBASE-9206) - provide another - level of security administration for tenants. - Region server groups (HBASE-6721) - A namespace/table can be + Quota Management (HBASE-8410) - Restrict the amount of resources (ie + regions, tables) a namespace can consume. + Namespace Security Administration (HBASE-9206) - provide another + level of security administration for tenants. + Region server groups (HBASE-6721) - A namespace/table can be pinned onto a subset of regionservers thus guaranteeing a course level of - isolation. + isolation.
Namespace management A namespace can be created, removed or altered. Namespace membership is determined during - table creation by specifying a fully-qualified table name of the form: - - <table namespace>:<table qualifier> - - - Examples: - - + table creation by specifying a fully-qualified table name of the form: + + <table namespace>:<table qualifier> + + + + Examples + + #Create a namespace create_namespace 'my_ns' - + + #create my_table in my_ns namespace create 'my_ns:my_table', 'fam' - + + #drop namespace drop_namespace 'my_ns' - + + #alter namespace alter_namespace 'my_ns', {METHOD => 'set', 'PROPERTY_NAME' => 'PROPERTY_VALUE'} - - + +
Predefined namespaces There are two predefined special namespaces: - hbase - system namespace, used to contain hbase internal tables - default - tables with no explicit specified namespace will automatically - fall into this namespace. + hbase - system namespace, used to contain hbase internal tables + default - tables with no explicit specified namespace will automatically + fall into this namespace. - - Examples: + + Examples + #namespace=foo and table qualifier=bar create 'foo:bar', 'fam' @@ -243,7 +247,7 @@ create 'foo:bar', 'fam' #namespace=default and table qualifier=bar create 'bar', 'fam' - +
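The shell commands above map directly onto the client Admin API. Below is a minimal Java sketch of the same namespace operations (assuming a release with namespace support; the namespace, table and family names reuse the shell examples):

Configuration conf = HBaseConfiguration.create();
HBaseAdmin admin = new HBaseAdmin(conf);
// Create a namespace
admin.createNamespace(NamespaceDescriptor.create("my_ns").build());
// Create my_table in the my_ns namespace
HTableDescriptor htd = new HTableDescriptor(TableName.valueOf("my_ns:my_table"));
htd.addFamily(new HColumnDescriptor("fam"));
admin.createTable(htd);
// A namespace can only be dropped once it is empty
admin.disableTable("my_ns:my_table");
admin.deleteTable("my_ns:my_table");
admin.deleteNamespace("my_ns");
admin.close();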
@@ -271,8 +275,8 @@ create 'bar', 'fam' courses:math are both members of the courses column family. The colon character (:) delimits the column family from the - column family qualifierColumn Family Qualifier. + >:) delimits the column family from the + column family qualifierColumn Family Qualifier. The column family prefix must be composed of printable characters. The qualifying tail, the column family qualifier, can be made of any @@ -651,9 +655,9 @@ htable.put(put);
ACID -
See ACID Semantics.
+        See ACID Semantics.
             Lars Hofhansl has also written a note on
-            ACID in HBase.
+ ACID in HBase.
@@ -794,7 +798,7 @@ public static class MyMapper extends TableMapper<Text, Text> {
HBase MapReduce Read/Write Example The following is an example of using HBase both as a source and as a sink with MapReduce. - This example will simply copy data from one table to another. + This example will simply copy data from one table to another. Configuration config = HBaseConfiguration.create(); Job job = new Job(config,"ExampleReadWrite"); @@ -823,11 +827,11 @@ if (!b) { throw new IOException("error with job!"); } - An explanation is required of what TableMapReduceUtil is doing, especially with the reducer. + An explanation is required of what TableMapReduceUtil is doing, especially with the reducer. TableOutputFormat is being used as the outputFormat class, and several parameters are being set on the config (e.g., TableOutputFormat.OUTPUT_TABLE), as well as setting the reducer output key to ImmutableBytesWritable and reducer value to Writable. - These could be set by the programmer on the job and conf, but TableMapReduceUtil tries to make things easier. + These could be set by the programmer on the job and conf, but TableMapReduceUtil tries to make things easier. The following is the example mapper, which will create a Put and matching the input Result and emit it. Note: this is what the CopyTable utility does. @@ -854,7 +858,6 @@ public static class MyMapper extends TableMapper<ImmutableBytesWritable, Put& This is just an example, developers could choose not to use TableOutputFormat and connect to the target table themselves. -
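The mapper body itself is garbled in this extract; the following is a sketch consistent with the description above (it mirrors what the CopyTable utility does): every KeyValue of the incoming Result is re-emitted in a Put keyed on the same row.

public static class MyMapper extends TableMapper<ImmutableBytesWritable, Put> {

    @Override
    public void map(ImmutableBytesWritable row, Result value, Context context)
        throws IOException, InterruptedException {
        // Build and emit a Put that mirrors the input Result.
        context.write(row, resultToPut(row, value));
    }

    private static Put resultToPut(ImmutableBytesWritable key, Result result) throws IOException {
        Put put = new Put(key.get());
        for (KeyValue kv : result.raw()) {
            put.add(kv);
        }
        return put;
    }
}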
HBase MapReduce Read/Write Example With Multi-Table Output @@ -962,8 +965,8 @@ if (!b) { throw new IOException("error with job!"); } - As stated above, the previous Mapper can run unchanged with this example. - As for the Reducer, it is a "generic" Reducer instead of extending TableMapper and emitting Puts. + As stated above, the previous Mapper can run unchanged with this example. + As for the Reducer, it is a "generic" Reducer instead of extending TableMapper and emitting Puts. public static class MyReducer extends Reducer<Text, IntWritable, Text, IntWritable> { @@ -1082,18 +1085,18 @@ if (!b) { RDBMS can scale well, but only up to a point - specifically, the size of a single database server - and for the best performance requires specialized hardware and storage devices. HBase features of note are: - Strongly consistent reads/writes: HBase is not an "eventually consistent" DataStore. This - makes it very suitable for tasks such as high-speed counter aggregation. - Automatic sharding: HBase tables are distributed on the cluster via regions, and regions are - automatically split and re-distributed as your data grows. - Automatic RegionServer failover - Hadoop/HDFS Integration: HBase supports HDFS out of the box as its distributed file system. - MapReduce: HBase supports massively parallelized processing via MapReduce for using HBase as both - source and sink. - Java Client API: HBase supports an easy to use Java API for programmatic access. - Thrift/REST API: HBase also supports Thrift and REST for non-Java front-ends. - Block Cache and Bloom Filters: HBase supports a Block Cache and Bloom Filters for high volume query optimization. - Operational Management: HBase provides build-in web-pages for operational insight as well as JMX metrics. + Strongly consistent reads/writes: HBase is not an "eventually consistent" DataStore. This + makes it very suitable for tasks such as high-speed counter aggregation. + Automatic sharding: HBase tables are distributed on the cluster via regions, and regions are + automatically split and re-distributed as your data grows. + Automatic RegionServer failover + Hadoop/HDFS Integration: HBase supports HDFS out of the box as its distributed file system. + MapReduce: HBase supports massively parallelized processing via MapReduce for using HBase as both + source and sink. + Java Client API: HBase supports an easy to use Java API for programmatic access. + Thrift/REST API: HBase also supports Thrift and REST for non-Java front-ends. + Block Cache and Bloom Filters: HBase supports a Block Cache and Bloom Filters for high volume query optimization. + Operational Management: HBase provides build-in web-pages for operational insight as well as JMX metrics.
@@ -1140,15 +1143,15 @@ if (!b) { Key: - .META. region key (.META.,,1) + .META. region key (.META.,,1) Values: - info:regioninfo (serialized HRegionInfo - instance of .META.) - info:server (server:port of the RegionServer holding .META.) - info:serverstartcode (start-time of the RegionServer process holding .META.) + info:regioninfo (serialized HRegionInfo + instance of .META.) + info:server (server:port of the RegionServer holding .META.) + info:serverstartcode (start-time of the RegionServer process holding .META.) @@ -1158,16 +1161,16 @@ if (!b) { Key: - Region key of the format ([table],[region start key],[region id]) + Region key of the format ([table],[region start key],[region id]) Values: - info:regioninfo (serialized - HRegionInfo instance for this region) + info:regioninfo (serialized + HRegionInfo instance for this region) - info:server (server:port of the RegionServer containing this region) - info:serverstartcode (start-time of the RegionServer process containing this region) + info:server (server:port of the RegionServer containing this region) + info:serverstartcode (start-time of the RegionServer process containing this region) When a table is in the process of splitting two other columns will be created, info:splitA and info:splitB @@ -1351,7 +1354,7 @@ scan.setFilter(filter); See the Oracle JavaDoc for supported RegEx patterns in Java. -
SubstringComparator +
SubstringComparator SubstringComparator can be used to determine if a given substring exists in a value. The comparison is case-insensitive. @@ -1518,12 +1521,12 @@ rs.close();
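A short usage sketch follows (the family and qualifier names cf and attr are placeholders, not from the text): the comparator is wrapped in a SingleColumnValueFilter and attached to a Scan.

SubstringComparator comp = new SubstringComparator("y val");   // looking for 'my value'
SingleColumnValueFilter filter = new SingleColumnValueFilter(Bytes.toBytes("cf"),
    Bytes.toBytes("attr"), CompareFilter.CompareOp.EQUAL, comp);
Scan scan = new Scan();
scan.setFilter(filter);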
Interface The methods exposed by HMasterInterface are primarily metadata-oriented methods: - Table (createTable, modifyTable, removeTable, enable, disable) - - ColumnFamily (addColumn, modifyColumn, removeColumn) - - Region (move, assign, unassign) - + Table (createTable, modifyTable, removeTable, enable, disable) + + ColumnFamily (addColumn, modifyColumn, removeColumn) + + Region (move, assign, unassign) + For example, when the HBaseAdmin method disableTable is invoked, it is serviced by the Master server. @@ -1551,9 +1554,9 @@ rs.close();
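To make the division of labor concrete, here is a minimal sketch of the kind of metadata calls that are serviced by the Master via HBaseAdmin (the table and family names are invented for the example):

Configuration conf = HBaseConfiguration.create();
HBaseAdmin admin = new HBaseAdmin(conf);
admin.disableTable("myTable");                                // Table-level, handled by the Master
admin.addColumn("myTable", new HColumnDescriptor("newFam"));  // ColumnFamily-level
admin.enableTable("myTable");
admin.close();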
Interface The methods exposed by HRegionRegionInterface contain both data-oriented and region-maintenance methods: - Data (get, put, delete, next, etc.) + Data (get, put, delete, next, etc.) - Region (splitRegion, compactRegion, etc.) + Region (splitRegion, compactRegion, etc.) For example, when the HBaseAdmin method majorCompact is invoked on a table, the client is actually iterating through @@ -1597,14 +1600,14 @@ rs.close(); The Block Cache is an LRU cache that contains three levels of block priority to allow for scan-resistance and in-memory ColumnFamilies: - Single access priority: The first time a block is loaded from HDFS it normally has this priority and it will be part of the first group to be considered - during evictions. The advantage is that scanned blocks are more likely to get evicted than blocks that are getting more usage. + Single access priority: The first time a block is loaded from HDFS it normally has this priority and it will be part of the first group to be considered + during evictions. The advantage is that scanned blocks are more likely to get evicted than blocks that are getting more usage. - Multi access priority: If a block in the previous priority group is accessed - again, it upgrades to this priority. It is thus part of the second group considered - during evictions. - In-memory access priority: If the block's family was configured to be "in-memory", it will be part of this priority disregarding the number of times it - was accessed. Catalog tables are configured like this. This group is the last one considered during evictions. + Mutli access priority: If a block in the previous priority group is accessed again, it upgrades to this priority. It is thus part of the second group + considered during evictions. + + In-memory access priority: If the block's family was configured to be "in-memory", it will be part of this priority disregarding the number of times it + was accessed. Catalog tables are configured like this. This group is the last one considered during evictions. @@ -1628,27 +1631,27 @@ rs.close(); make the process blocking from the point where it loads new blocks. Here are some examples: - One region server with the default heap size (1GB) and the default block cache size will have 217MB of block cache available. + One region server with the default heap size (1GB) and the default block cache size will have 217MB of block cache available. - 20 region servers with the heap size set to 8GB and a default block cache size will have 34GB of block cache. + 20 region servers with the heap size set to 8GB and a default block cache size will have 34GB of block cache. - 100 region servers with the heap size set to 24GB and a block cache size of 0.5 will have about 1TB of block cache. + 100 region servers with the heap size set to 24GB and a block cache size of 0.5 will have about 1TB of block cache. Your data isn't the only resident of the block cache, here are others that you may have to take into account: - Catalog tables: The -ROOT- and .META. tables are forced into the block cache and have the in-memory priority which means that they are harder to evict. The former never uses - more than a few hundreds of bytes while the latter can occupy a few MBs (depending on the number of regions). + Catalog tables: The -ROOT- and .META. tables are forced into the block cache and have the in-memory priority which means that they are harder to evict. 
The former never uses + more than a few hundreds of bytes while the latter can occupy a few MBs (depending on the number of regions). - HFiles indexes: HFile is the file format that HBase uses to store data in HDFS and it contains a multi-layered index in order seek to the data without having to read the whole file. + HFiles indexes: HFile is the file format that HBase uses to store data in HDFS and it contains a multi-layered index in order seek to the data without having to read the whole file. The size of those indexes is a factor of the block size (64KB by default), the size of your keys and the amount of data you are storing. For big data sets it's not unusual to see numbers around - 1GB per region server, although not all of it will be in cache because the LRU will evict indexes that aren't used. + 1GB per region server, although not all of it will be in cache because the LRU will evict indexes that aren't used. - Keys: Taking into account only the values that are being stored is missing half the picture since every value is stored along with its keys - (row key, family, qualifier, and timestamp). See . + Keys: Taking into account only the values that are being stored is missing half the picture since every value is stored along with its keys + (row key, family, qualifier, and timestamp). See . - Bloom filters: Just like the HFile indexes, those data structures (when enabled) are stored in the LRU. + Bloom filters: Just like the HFile indexes, those data structures (when enabled) are stored in the LRU. Currently the recommended way to measure HFile indexes and bloom filters sizes is to look at the region server web UI and checkout the relevant metrics. For keys, @@ -1658,14 +1661,14 @@ rs.close(); but you need to process 1TB of data. One of the reasons is that the churn generated by the evictions will trigger more garbage collections unnecessarily. Here are two use cases: - Fully random reading pattern: This is a case where you almost never access the same row twice within a short amount of time such that the chance of hitting a cached block is close + Fully random reading pattern: This is a case where you almost never access the same row twice within a short amount of time such that the chance of hitting a cached block is close to 0. Setting block caching on such a table is a waste of memory and CPU cycles, more so that it will generate more garbage to pick up by the JVM. For more information on monitoring GC, - see . + see . - Mapping a table: In a typical MapReduce job that takes a table in input, every row will be read only once so there's no need to put them into the block cache. The Scan object has + Mapping a table: In a typical MapReduce job that takes a table in input, every row will be read only once so there's no need to put them into the block cache. The Scan object has the option of turning this off via the setCaching method (set it to false). You can still keep block caching turned on on this table if you need fast random read access. An example would be counting the number of rows in a table that serves live traffic, caching every block of that table would create massive churn and would surely evict data that's currently in use. - +
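Two of the knobs mentioned above can be set from the client and the table descriptor; a minimal sketch follows (the family name cf is a placeholder). Note that on the Scan object block caching is controlled by setCacheBlocks(boolean), while setCaching(int) sets how many rows are fetched per RPC.

// Full-table MapReduce scan: keep one-time reads out of the LRU so they don't evict hot blocks.
Scan scan = new Scan();
scan.setCaching(500);         // rows per RPC; unrelated to the block cache
scan.setCacheBlocks(false);   // skip the block cache for this scan

// Small, hot family that should get the in-memory priority described above.
HColumnDescriptor hcd = new HColumnDescriptor("cf");
hcd.setInMemory(true);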
Offheap Block Cache @@ -1687,7 +1690,7 @@ rs.close(); This ensures that HBase has durable writes. Without WAL, there is the possibility of data loss in the case of a RegionServer failure before each MemStore is flushed and new StoreFiles are written. HLog is the HBase WAL implementation, and there is one HLog instance per RegionServer. - The WAL is in HDFS in /hbase/.logs/ with subdirectories per region. + The WAL is in HDFS in /hbase/.logs/ with subdirectories per region. For more general information about the concept of write ahead logs, see the Wikipedia Write-Ahead Log article. @@ -1759,13 +1762,14 @@ rs.close(); For a description of what HBase files look like when written to HDFS, see .
+ Considerations for Number of Regions In general, HBase is designed to run with a small (20-200) number of relatively large (5-20Gb) regions per server. The considerations for this are as follows:
Why cannot I have too many regions? Typically you want to keep your region count low on HBase for numerous reasons. Usually right around 100 regions per RegionServer has yielded the best results. - Here are some of the reasons below for keeping region count low: + Here are some of the reasons below for keeping region count low: MSLAB requires 2mb per memstore (that's 2mb per family per region). @@ -1795,12 +1799,13 @@ rs.close(); creating memory pressure or OOME on the RSs - + Another issue is the effect of the number of regions on mapreduce jobs; it is typical to have one mapper per HBase region. + Thus, hosting only 5 regions per RS may not be enough to get sufficient number of tasks for a mapreduce job, while 1000 regions will generate far too many tasks. + + See for configuration guidelines. +
- Another issue is the effect of the number of regions on mapreduce jobs; it is typical to have one mapper per HBase region. - Thus, hosting only 5 regions per RS may not be enough to get sufficient number of tasks for a mapreduce job, while 1000 regions will generate far too many tasks. - - See for configuration guidelines. +
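As a rough back-of-the-envelope check of the memstore-pressure argument above (the heap size, memstore fraction and region count here are illustrative, not taken from the text):

// With a 16GB heap, 40% reserved for memstores, and 200 regions x 1 family all written
// at a similar rate, each memstore can only reach ~33MB before the global memstore limit
// forces flushes -- far below a 128MB flush size, so flushes are small and frequent.
double heapMb = 16 * 1024;
double globalMemstoreFraction = 0.4;   // hbase.regionserver.global.memstore.upperLimit
int regions = 200, familiesPerRegion = 1;
double perMemstoreMb = heapMb * globalMemstoreFraction / (regions * familiesPerRegion);
System.out.printf("~%.0f MB per memstore%n", perMemstoreMb);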
@@ -1812,18 +1817,18 @@ rs.close(); Startup When HBase starts regions are assigned as follows (short version): - The Master invokes the AssignmentManager upon startup. + The Master invokes the AssignmentManager upon startup. - The AssignmentManager looks at the existing region assignments in META. + The AssignmentManager looks at the existing region assignments in META. - If the region assignment is still valid (i.e., if the RegionServer is still online) - then the assignment is kept. + If the region assignment is still valid (i.e., if the RegionServer is still online) + then the assignment is kept. - If the assignment is invalid, then the LoadBalancerFactory is invoked to assign the - region. The DefaultLoadBalancer will randomly assign the region to a RegionServer. + If the assignment is invalid, then the LoadBalancerFactory is invoked to assign the + region. The DefaultLoadBalancer will randomly assign the region to a RegionServer. - META is updated with the RegionServer assignment (if needed) and the RegionServer start codes - (start time of the RegionServer process) upon region opening by the RegionServer. + META is updated with the RegionServer assignment (if needed) and the RegionServer start codes + (start time of the RegionServer process) upon region opening by the RegionServer. @@ -1833,12 +1838,12 @@ rs.close(); Failover When a RegionServer fails (short version): - The regions immediately become unavailable because the RegionServer is down. + The regions immediately become unavailable because the RegionServer is down. - The Master will detect that the RegionServer has failed. + The Master will detect that the RegionServer has failed. - The region assignments will be considered invalid and will be re-assigned just - like the startup sequence. + The region assignments will be considered invalid and will be re-assigned just + like the startup sequence. @@ -1856,18 +1861,19 @@ rs.close();
Region-RegionServer Locality Over time, Region-RegionServer locality is achieved via HDFS block replication. - The HDFS client does the following by default when choosing locations to write replicas: + The HDFS client does the following by default when choosing locations to write replicas: - First replica is written to local node + First replica is written to local node - Second replica is written to a random node on another rack + Second replica is written to a random node on another rack - Third replica is written on the same rack as the second, but on a different node chosen randomly + Third replica is written on the same rack as the second, but on a different node chosen randomly - Subsequent replicas are written on random nodes on the cluster + Subsequent replicas are written on random nodes on the cluster See Replica Placement: The First Baby Steps on this page: HDFS Architecture - + + Thus, HBase eventually achieves locality for a region after a flush or a compaction. In a RegionServer failover situation a RegionServer may be assigned regions with non-local StoreFiles (because none of the replicas are local), however as new data is written @@ -1949,7 +1955,7 @@ myHtd.setValue(HTableDescriptor.SPLIT_POLICY, MyCustomSplitPolicy.class.getName( the SSTable file described in the BigTable [2006] paper and on Hadoop's tfile (The unit test suite and the compression harness were taken directly from tfile). - Schubert Zhang's blog post on HFile: A Block-Indexed File Format to Store Sorted Key-Value Pairs makes for a thorough introduction to HBase's hfile. Matteo Bertozzi has also put up a + Schubert Zhang's blog post on HFile: A Block-Indexed File Format to Store Sorted Key-Value Pairs makes for a thorough introduction to HBase's hfile. Matteo Bertozzi has also put up a helpful description, HBase I/O: HFile. For more information, see the HFile source code. @@ -1992,21 +1998,21 @@ myHtd.setValue(HTableDescriptor.SPLIT_POLICY, MyCustomSplitPolicy.class.getName( The KeyValue format inside a byte array is: - keylength - valuelength - key - value + keylength + valuelength + key + value The Key is further decomposed as: - rowlength - row (i.e., the rowkey) - columnfamilylength - columnfamily - columnqualifier - timestamp - keytype (e.g., Put, Delete, DeleteColumn, DeleteFamily) + rowlength + row (i.e., the rowkey) + columnfamilylength + columnfamily + columnqualifier + timestamp + keytype (e.g., Put, Delete, DeleteColumn, DeleteFamily) KeyValue instances are not split across blocks. @@ -2016,37 +2022,38 @@ myHtd.setValue(HTableDescriptor.SPLIT_POLICY, MyCustomSplitPolicy.class.getName(
Example To emphasize the points above, examine what happens with two Puts for two different columns for the same row: - Put #1: rowkey=row1, cf:attr1=value1 - Put #2: rowkey=row1, cf:attr2=value2 + Put #1: rowkey=row1, cf:attr1=value1 + Put #2: rowkey=row1, cf:attr2=value2 Even though these are for the same row, a KeyValue is created for each column: Key portion for Put #1: - rowlength ------------> 4 - row -----------------> row1 - columnfamilylength ---> 2 - columnfamily --------> cf - columnqualifier ------> attr1 - timestamp -----------> server time of Put - keytype -------------> Put + rowlength ------------> 4 + row -----------------> row1 + columnfamilylength ---> 2 + columnfamily --------> cf + columnqualifier ------> attr1 + timestamp -----------> server time of Put + keytype -------------> Put Key portion for Put #2: - rowlength ------------> 4 - row -----------------> row1 - columnfamilylength ---> 2 - columnfamily --------> cf - columnqualifier ------> attr2 - timestamp -----------> server time of Put - keytype -------------> Put + rowlength ------------> 4 + row -----------------> row1 + columnfamilylength ---> 2 + columnfamily --------> cf + columnqualifier ------> attr2 + timestamp -----------> server time of Put + keytype -------------> Put + It is critical to understand that the rowkey, ColumnFamily, and column (aka columnqualifier) are embedded within + the KeyValue instance. The longer these identifiers are, the bigger the KeyValue is.
- It is critical to understand that the rowkey, ColumnFamily, and column (aka columnqualifier) are embedded within - the KeyValue instance. The longer these identifiers are, the bigger the KeyValue is. +
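A quick way to see this effect from the client API (the row, family and qualifier names below are invented for the comparison):

// Same value, different identifier lengths: the serialized KeyValue grows with the key parts.
KeyValue shortIds = new KeyValue(Bytes.toBytes("r1"), Bytes.toBytes("f"),
    Bytes.toBytes("q"), Bytes.toBytes("value1"));
KeyValue longIds = new KeyValue(Bytes.toBytes("customer-0000000001"),
    Bytes.toBytes("customer_details"), Bytes.toBytes("email_address_verified"),
    Bytes.toBytes("value1"));
System.out.println(shortIds.getLength());   // total serialized size in bytes
System.out.println(longIds.getLength());    // larger, purely because of the longer identifiers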
Compaction @@ -2078,16 +2085,16 @@ myHtd.setValue(HTableDescriptor.SPLIT_POLICY, MyCustomSplitPolicy.class.getName( Important knobs: - hbase.store.compaction.ratio Ratio used in compaction - file selection algorithm (default 1.2f). - hbase.hstore.compaction.min (.90 hbase.hstore.compactionThreshold) (files) Minimum number - of StoreFiles per Store to be selected for a compaction to occur (default 2). - hbase.hstore.compaction.max (files) Maximum number of StoreFiles to compact per minor compaction (default 10). - hbase.hstore.compaction.min.size (bytes) + hbase.store.compaction.ratio Ratio used in compaction + file selection algorithm (default 1.2f). + hbase.hstore.compaction.min (.90 hbase.hstore.compactionThreshold) (files) Minimum number + of StoreFiles per Store to be selected for a compaction to occur (default 2). + hbase.hstore.compaction.max (files) Maximum number of StoreFiles to compact per minor compaction (default 10). + hbase.hstore.compaction.min.size (bytes) Any StoreFile smaller than this setting with automatically be a candidate for compaction. Defaults to - hbase.hregion.memstore.flush.size (128 mb). - hbase.hstore.compaction.max.size (.92) (bytes) - Any StoreFile larger than this setting with automatically be excluded from compaction (default Long.MAX_VALUE). + hbase.hregion.memstore.flush.size (128 mb). + hbase.hstore.compaction.max.size (.92) (bytes) + Any StoreFile larger than this setting with automatically be excluded from compaction (default Long.MAX_VALUE). The minor compaction StoreFile selection logic is size based, and selects a file for compaction when the file @@ -2096,26 +2103,27 @@ myHtd.setValue(HTableDescriptor.SPLIT_POLICY, MyCustomSplitPolicy.class.getName(
Minor Compaction File Selection - Example #1 (Basic Example) - This example mirrors an example from the unit test TestCompactSelection. + This example mirrors an example from the unit test TestCompactSelection. - hbase.store.compaction.ratio = 1.0f - hbase.hstore.compaction.min = 3 (files) > - hbase.hstore.compaction.max = 5 (files) > - hbase.hstore.compaction.min.size = 10 (bytes) > - hbase.hstore.compaction.max.size = 1000 (bytes) > + hbase.store.compaction.ratio = 1.0f + hbase.hstore.compaction.min = 3 (files) + hbase.hstore.compaction.max = 5 (files) + hbase.hstore.compaction.min.size = 10 (bytes) + hbase.hstore.compaction.max.size = 1000 (bytes) + The following StoreFiles exist: 100, 50, 23, 12, and 12 bytes apiece (oldest to newest). With the above parameters, the files that would be selected for minor compaction are 23, 12, and 12. Why? - 100 --> No, because sum(50, 23, 12, 12) * 1.0 = 97. - 50 --> No, because sum(23, 12, 12) * 1.0 = 47. - 23 --> Yes, because sum(12, 12) * 1.0 = 24. - 12 --> Yes, because the previous file has been included, and because this - does not exceed the the max-file limit of 5 - 12 --> Yes, because the previous file had been included, and because this - does not exceed the the max-file limit of 5. + 100 --> No, because sum(50, 23, 12, 12) * 1.0 = 97. + 50 --> No, because sum(23, 12, 12) * 1.0 = 47. + 23 --> Yes, because sum(12, 12) * 1.0 = 24. + 12 --> Yes, because the previous file has been included, and because this + does not exceed the the max-file limit of 5 + 12 --> Yes, because the previous file had been included, and because this + does not exceed the the max-file limit of 5.
@@ -2123,11 +2131,11 @@ myHtd.setValue(HTableDescriptor.SPLIT_POLICY, MyCustomSplitPolicy.class.getName( Minor Compaction File Selection - Example #2 (Not Enough Files To Compact) This example mirrors an example from the unit test TestCompactSelection. - hbase.store.compaction.ratio = 1.0f - hbase.hstore.compaction.min = 3 (files) > - hbase.hstore.compaction.max = 5 (files) > - hbase.hstore.compaction.min.size = 10 (bytes) > - hbase.hstore.compaction.max.size = 1000 (bytes) > + hbase.store.compaction.ratio = 1.0f + hbase.hstore.compaction.min = 3 (files) + hbase.hstore.compaction.max = 5 (files) + hbase.hstore.compaction.min.size = 10 (bytes) + hbase.hstore.compaction.max.size = 1000 (bytes) The following StoreFiles exist: 100, 25, 12, and 12 bytes apiece (oldest to newest). @@ -2135,35 +2143,35 @@ myHtd.setValue(HTableDescriptor.SPLIT_POLICY, MyCustomSplitPolicy.class.getName( Why? - 100 --> No, because sum(25, 12, 12) * 1.0 = 47 - 25 --> No, because sum(12, 12) * 1.0 = 24 - 12 --> No. Candidate because sum(12) * 1.0 = 12, there are only 2 files to compact and that is less than the threshold of 3 - 12 --> No. Candidate because the previous StoreFile was, but there are not enough files to compact + 100 --> No, because sum(25, 12, 12) * 1.0 = 47 + 25 --> No, because sum(12, 12) * 1.0 = 24 + 12 --> No. Candidate because sum(12) * 1.0 = 12, there are only 2 files to compact and that is less than the threshold of 3 + 12 --> No. Candidate because the previous StoreFile was, but there are not enough files to compact
-
+
Minor Compaction File Selection - Example #3 (Limiting Files To Compact) This example mirrors an example from the unit test TestCompactSelection. - hbase.store.compaction.ratio = 1.0f - hbase.hstore.compaction.min = 3 (files) > - hbase.hstore.compaction.max = 5 (files) > - hbase.hstore.compaction.min.size = 10 (bytes) > - hbase.hstore.compaction.max.size = 1000 (bytes) > + hbase.store.compaction.ratio = 1.0f + hbase.hstore.compaction.min = 3 (files) + hbase.hstore.compaction.max = 5 (files) + hbase.hstore.compaction.min.size = 10 (bytes) + hbase.hstore.compaction.max.size = 1000 (bytes) The following StoreFiles exist: 7, 6, 5, 4, 3, 2, and 1 bytes apiece (oldest to newest). With the above parameters, the files that would be selected for minor compaction are 7, 6, 5, 4, 3. Why? - 7 --> Yes, because sum(6, 5, 4, 3, 2, 1) * 1.0 = 21. Also, 7 is less than the min-size - 6 --> Yes, because sum(5, 4, 3, 2, 1) * 1.0 = 15. Also, 6 is less than the min-size. - 5 --> Yes, because sum(4, 3, 2, 1) * 1.0 = 10. Also, 5 is less than the min-size. - 4 --> Yes, because sum(3, 2, 1) * 1.0 = 6. Also, 4 is less than the min-size. - 3 --> Yes, because sum(2, 1) * 1.0 = 3. Also, 3 is less than the min-size. - 2 --> No. Candidate because previous file was selected and 2 is less than the min-size, but the max-number of files to compact has been reached. - 1 --> No. Candidate because previous file was selected and 1 is less than the min-size, but max-number of files to compact has been reached. + 7 --> Yes, because sum(6, 5, 4, 3, 2, 1) * 1.0 = 21. Also, 7 is less than the min-size + 6 --> Yes, because sum(5, 4, 3, 2, 1) * 1.0 = 15. Also, 6 is less than the min-size. + 5 --> Yes, because sum(4, 3, 2, 1) * 1.0 = 10. Also, 5 is less than the min-size. + 4 --> Yes, because sum(3, 2, 1) * 1.0 = 6. Also, 4 is less than the min-size. + 3 --> Yes, because sum(2, 1) * 1.0 = 3. Also, 3 is less than the min-size. + 2 --> No. Candidate because previous file was selected and 2 is less than the min-size, but the max-number of files to compact has been reached. + 1 --> No. Candidate because previous file was selected and 1 is less than the min-size, but max-number of files to compact has been reached.
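The three worked examples above all follow the same walk over the StoreFiles, oldest to newest. The sketch below captures that selection rule in isolation; it is deliberately simplified (it ignores the hbase.hstore.compaction.min.size automatic-candidate and max.size exclusion handling, and is not the actual Store code):

import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collections;
import java.util.List;

// A file qualifies when its size is no larger than sum(sizes of all newer files) * ratio;
// once one file qualifies, newer files are pulled in up to the max-file limit, and the
// result is discarded if it falls below the min-file limit.
static List<Long> selectForMinorCompaction(List<Long> fileSizes /* oldest to newest */,
    double ratio, int minFiles, int maxFiles) {
  List<Long> selected = new ArrayList<Long>();
  for (int i = 0; i < fileSizes.size() && selected.size() < maxFiles; i++) {
    long sumOfNewer = 0;
    for (int j = i + 1; j < fileSizes.size(); j++) {
      sumOfNewer += fileSizes.get(j);
    }
    if (!selected.isEmpty() || fileSizes.get(i) <= sumOfNewer * ratio) {
      selected.add(fileSizes.get(i));
    }
  }
  return selected.size() >= minFiles ? selected : Collections.<Long>emptyList();
}

// selectForMinorCompaction(Arrays.asList(100L, 50L, 23L, 12L, 12L), 1.0, 3, 5)   -> [23, 12, 12]
// selectForMinorCompaction(Arrays.asList(100L, 25L, 12L, 12L), 1.0, 3, 5)        -> []
// selectForMinorCompaction(Arrays.asList(7L, 6L, 5L, 4L, 3L, 2L, 1L), 1.0, 3, 5) -> [7, 6, 5, 4, 3]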
@@ -2187,11 +2195,11 @@ This feature is fully compatible with default compactions - it can be enabled fo
When to use You might want to consider using this feature if you have: - -large regions (in that case, you can get the positive effect of much smaller regions without additional memstore and region management overhead); or - +large regions (in that case, you can get the positive effect of much smaller regions without additional memstore and region management overhead); or + + non-uniform row keys, e.g. time dimension in a key (in that case, only the stripes receiving the new keys will keep compacting - old data will not compact as much, or at all). - + According to perf testing performed, in these case the read performance can improve somewhat, and the read and write performance variability due to compactions is greatly reduced. There's overall perf improvement on large, non-uniform row key regions (hash-prefixed timestamp key) over long term. All of these performance gains are best realized when table is already large. In future, the perf improvement might also extend to region splits. @@ -2226,21 +2234,23 @@ Based on your region sizing, you might want to also change your stripe sizing. B You can improve this pattern for your data. You should generally aim at stripe size of at least 1Gb, and about 8-12 stripes for uniform row keys - so, for example if your regions are 30 Gb, 12x2.5Gb stripes might be a good idea. The settings are as follows: - + SettingNotes hbase.store.stripe.initialStripeCount -Initial stripe count to create. You can use it as follows: - - +Initial stripe count to create. You can use it as follows: + + for relatively uniform row keys, if you know the approximate target number of stripes from the above, you can avoid some splitting overhead by starting w/several stripes (2, 5, 10...). Note that if the early data is not representative of overall row key distribution, this will not be as efficient. - + + for existing tables with lots of data, you can use this to pre-split stripes. - -for e.g. hash-prefixed sequential keys, with more than one hash prefix per region, you know that some pre-splitting makes sense. - + + +for e.g. hash-prefixed sequential keys, with more than one hash prefix per region, you know that some pre-splitting makes sense. + hbase.store.stripe.sizeToSplit @@ -2252,7 +2262,7 @@ Maximum stripe size before it's split. You can use this in conjunction with the The number of new stripes to create when splitting one. The default is 2, and is good for most cases. For non-uniform row keys, you might experiment with increasing the number somewhat (3-4), to isolate the arriving updates into narrower slice of the region with just one split instead of several. -
+
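As a sketch of how these settings are typically applied per table (the table and family names are invented; the engine class name org.apache.hadoop.hbase.regionserver.StripeStoreEngine and the use of HTableDescriptor.setConfiguration reflect the stripe-compaction implementation of that era and should be verified against your release):

HBaseAdmin admin = new HBaseAdmin(HBaseConfiguration.create());
HTableDescriptor htd = new HTableDescriptor(TableName.valueOf("my_table"));
htd.addFamily(new HColumnDescriptor("fam"));
// Use the stripe engine, start with 10 stripes, and split a stripe once it reaches ~2GB.
htd.setConfiguration("hbase.hstore.engine.class",
    "org.apache.hadoop.hbase.regionserver.StripeStoreEngine");
htd.setConfiguration("hbase.store.stripe.initialStripeCount", "10");
htd.setConfiguration("hbase.store.stripe.sizeToSplit", String.valueOf(2L * 1024 * 1024 * 1024));
admin.createTable(htd);
admin.close();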
Memstore sizing @@ -2354,7 +2364,7 @@ All the settings that apply to normal compactions (file size limits, etc.) apply where importtsv or your MapReduce job put its results, and the table name to import into. For example: - $ hadoop jar hbase-VERSION.jar completebulkload [-c /path/to/hbase/config/hbase-site.xml] /user/todd/myoutput mytable + $ hadoop jar hbase-VERSION.jar completebulkload [-c /path/to/hbase/config/hbase-site.xml] /user/todd/myoutput mytable The -c config-file option can be used to specify a file containing the appropriate hbase parameters (e.g., hbase-site.xml) if @@ -2374,7 +2384,7 @@ All the settings that apply to normal compactions (file size limits, etc.) apply For more information about the referenced utilities, see and . - See How-to: Use HBase Bulk Loading, and Why + See How-to: Use HBase Bulk Loading, and Why for a recent blog on current state of bulk loading.
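The same completebulkload step can also be driven from Java; a minimal sketch (reusing the example output directory and table name from above, and assuming the usual org.apache.hadoop.hbase.mapreduce.LoadIncrementalHFiles class):

Configuration conf = HBaseConfiguration.create();
HTable table = new HTable(conf, "mytable");
LoadIncrementalHFiles loader = new LoadIncrementalHFiles(conf);
// Moves the prepared HFiles under the output directory into the table's regions.
loader.doBulkLoad(new Path("/user/todd/myoutput"), table);
table.close();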
@@ -2422,12 +2432,11 @@ All the settings that apply to normal compactions (file size limits, etc.) apply - FAQ - + General When should I use HBase? @@ -2488,7 +2497,7 @@ All the settings that apply to normal compactions (file size limits, etc.) apply - + Where can I learn about the rest of the configuration options? @@ -2629,7 +2638,7 @@ identifying mode and a multi-phase read-write repair mode.
Running hbck to identify inconsistencies -To check to see if your HBase cluster has corruptions, run hbck against your HBase cluster: +To check to see if your HBase cluster has corruptions, run hbck against your HBase cluster: $ ./bin/hbase hbck @@ -2645,9 +2654,9 @@ listing of all the splits present in all the tables. $ ./bin/hbase hbck -details -If you just want to know if some tables are corrupted, you can limit hbck to identify inconsistencies +If you just want to know if some tables are corrupted, you can limit hbck to identify inconsistencies in only specific tables. For example the following command would only attempt to check table -TableFoo and TableBar. The benefit is that hbck will run in less time. +TableFoo and TableBar. The benefit is that hbck will run in less time. $ ./bin/hbase hbck TableFoo TableBar @@ -2662,12 +2671,12 @@ the hbck tool enabled with automatic repair options. There are two invariants that when violated create inconsistencies in HBase: - HBase’s region consistency invariant is satisfied if every region is assigned and + HBase’s region consistency invariant is satisfied if every region is assigned and deployed on exactly one region server, and all places where this state kept is in -accordance. +accordance. - HBase’s table integrity invariant is satisfied if for each table, every possible row key -resolves to exactly one region. + HBase’s table integrity invariant is satisfied if for each table, every possible row key +resolves to exactly one region. @@ -2698,11 +2707,11 @@ Region consistency requires that the HBase instance has the state of the region (.regioninfo files), the region’s row in the .META. table., and region’s deployment/assignments on region servers and the master in accordance. Options for repairing region consistency include: - -fixAssignments (equivalent to the 0.90 -fix option) repairs unassigned, incorrectly -assigned or multiply assigned regions. + -fixAssignments (equivalent to the 0.90 -fix option) repairs unassigned, incorrectly +assigned or multiply assigned regions. - -fixMeta which removes meta rows when corresponding regions are not present in -HDFS and adds new meta rows if they regions are present in HDFS while not in META. + -fixMeta which removes meta rows when corresponding regions are not present in + HDFS and adds new meta rows if they regions are present in HDFS while not in META. To fix deployment and assignment problems you can run this command: @@ -2710,48 +2719,48 @@ HDFS and adds new meta rows if they regions are present in HDFS while not in MET $ ./bin/hbase hbck -fixAssignments -To fix deployment and assignment problems as well as repairing incorrect meta rows you can -run this command:. +To fix deployment and assignment problems as well as repairing incorrect meta rows you can +run this command: $ ./bin/hbase hbck -fixAssignments -fixMeta -There are a few classes of table integrity problems that are low risk repairs. The first two are +There are a few classes of table integrity problems that are low risk repairs. The first two are degenerate (startkey == endkey) regions and backwards regions (startkey > endkey). These are automatically handled by sidelining the data to a temporary directory (/hbck/xxxx). -The third low-risk class is hdfs region holes. This can be repaired by using the: +The third low-risk class is hdfs region holes. This can be repaired by using the: - -fixHdfsHoles option for fabricating new empty regions on the file system. 
-If holes are detected you can use -fixHdfsHoles and should include -fixMeta and -fixAssignments to make the new region consistent. + -fixHdfsHoles option for fabricating new empty regions on the file system. +If holes are detected you can use -fixHdfsHoles and should include -fixMeta and -fixAssignments to make the new region consistent. $ ./bin/hbase hbck -fixAssignments -fixMeta -fixHdfsHoles -Since this is a common operation, we’ve added a the -repairHoles flag that is equivalent to the -previous command: +Since this is a common operation, we’ve added the -repairHoles flag that is equivalent to the +previous command: $ ./bin/hbase hbck -repairHoles -If inconsistencies still remain after these steps, you most likely have table integrity problems -related to orphaned or overlapping regions. +If inconsistencies still remain after these steps, you most likely have table integrity problems +related to orphaned or overlapping regions.
Region Overlap Repairs -Table integrity problems can require repairs that deal with overlaps. This is a riskier operation +Table integrity problems can require repairs that deal with overlaps. This is a riskier operation because it requires modifications to the file system, requires some decision making, and may require some manual steps. For these repairs it is best to analyze the output of a hbck -details run so that you isolate repairs attempts only upon problems the checks identify. Because this is riskier, there are safeguard that should be used to limit the scope of the repairs. WARNING: This is a relatively new and have only been tested on online but idle HBase instances (no reads/writes). Use at your own risk in an active production environment! -The options for repairing table integrity violations include: +The options for repairing table integrity violations include: - -fixHdfsOrphans option for “adopting” a region directory that is missing a region -metadata file (the .regioninfo file). + -fixHdfsOrphans option for “adopting” a region directory that is missing a region +metadata file (the .regioninfo file). - -fixHdfsOverlaps ability for fixing overlapping regions + -fixHdfsOverlaps ability for fixing overlapping regions -When repairing overlapping regions, a region’s data can be modified on the file system in two +When repairing overlapping regions, a region’s data can be modified on the file system in two ways: 1) by merging regions into a larger region or 2) by sidelining regions by moving data to “sideline” directory where data could be restored later. Merging a large number of regions is technically correct but could result in an extremely large region that requires series of costly @@ -2760,58 +2769,58 @@ that overlap with the most other regions (likely the largest ranges) so that mer a more reasonable scale. Since these sidelined regions are already laid out in HBase’s native directory and HFile format, they can be restored by using HBase’s bulk load mechanism. The default safeguard thresholds are conservative. These options let you override the default -thresholds and to enable the large region sidelining feature. +thresholds and to enable the large region sidelining feature. - -maxMerge <n> maximum number of overlapping regions to merge + -maxMerge <n> maximum number of overlapping regions to merge - -sidelineBigOverlaps if more than maxMerge regions are overlapping, sideline attempt -to sideline the regions overlapping with the most other regions. + -sidelineBigOverlaps if more than maxMerge regions are overlapping, sideline attempt +to sideline the regions overlapping with the most other regions. - -maxOverlapsToSideline <n> if sidelining large overlapping regions, sideline at most n -regions. + -maxOverlapsToSideline <n> if sidelining large overlapping regions, sideline at most n +regions. -Since often times you would just want to get the tables repaired, you can use this option to turn -on all repair options: +Since often times you would just want to get the tables repaired, you can use this option to turn +on all repair options: - -repair includes all the region consistency options and only the hole repairing table -integrity options. + -repair includes all the region consistency options and only the hole repairing table +integrity options. -Finally, there are safeguards to limit repairs to only specific tables. For example the following -command would only attempt to check and repair table TableFoo and TableBar. 
- +Finally, there are safeguards to limit repairs to only specific tables. For example the following +command would only attempt to check and repair table TableFoo and TableBar. + $ ./bin/hbase hbck -repair TableFoo TableBar - +
Special cases: Meta is not properly assigned -There are a few special cases that hbck can handle as well. +There are a few special cases that hbck can handle as well. Sometimes the meta table’s only region is inconsistently assigned or deployed. In this case -there is a special -fixMetaOnly option that can try to fix meta assignments. - +there is a special -fixMetaOnly option that can try to fix meta assignments. + $ ./bin/hbase hbck -fixMetaOnly -fixAssignments - +
Special cases: HBase version file is missing -HBase’s data on the file system requires a version file in order to start. If this flie is missing, you +HBase’s data on the file system requires a version file in order to start. If this file is missing, you can use the -fixVersionFile option to fabricate a new HBase version file. This assumes that -the version of hbck you are running is the appropriate version for the HBase cluster. +the version of hbck you are running is the appropriate version for the HBase cluster.
Special case: Root and META are corrupt. -The most drastic corruption scenario is the case where the ROOT or META is corrupted and +The most drastic corruption scenario is the case where the ROOT or META is corrupted and HBase will not start. In this case you can use the OfflineMetaRepair tool create new ROOT and META regions and tables. This tool assumes that HBase is offline. It then marches through the existing HBase home directory, loads as much information from region metadata files (.regioninfo files) as possible from the file system. If the region metadata has proper table integrity, it sidelines the original root and meta table directories, and builds new ones with pointers to the region directories and their -data. - +data. + $ ./bin/hbase org.apache.hadoop.hbase.util.hbck.OfflineMetaRepair - -NOTE: This tool is not as clever as uberhbck but can be used to bootstrap repairs that uberhbck + +NOTE: This tool is not as clever as uberhbck but can be used to bootstrap repairs that uberhbck can complete. -If the tool succeeds you should be able to start hbase and run online repairs if necessary. +If the tool succeeds you should be able to start hbase and run online repairs if necessary.
Special cases: Offline split parent @@ -3022,15 +3031,12 @@ hbase> describe 't1'
HFile format version 1 overview As we will be discussing the changes we are making to the HFile format, it is useful to give a short overview of the previous (HFile version 1) format. An HFile in the existing format is structured as follows: - + HFile Version 1 - - HFile Version 1 - - + Image courtesy of Lars George, hbase-architecture-101-storage.html. @@ -3065,15 +3071,11 @@ hbase> describe 't1' The version of HBase introducing the above features reads both version 1 and 2 HFiles, but only writes version 2 HFiles. A version 2 HFile is structured as follows: - + HFile Version 2 - - HFile Version 2 - - @@ -3341,7 +3343,7 @@ Comparator class used for Bloom filter keys, a UTF>8 encoded string stored usi
File Info format in versions 1 and 2 - The file info block is a serialized HbaseMapWritable (essentially a map from byte arrays to byte arrays) with the following keys, among others. StoreFile-level logic adds more keys to this. + The file info block is a serialized HbaseMapWritable (essentially a map from byte arrays to byte arrays) with the following keys, among others. StoreFile-level logic adds more keys to this. @@ -3479,8 +3481,8 @@ Comparator class used for Bloom filter keys, a UTF>8 encoded string stored usi In HBASE-7845, we generate a new key that is lexicographically larger than the last key of the previous block and lexicographically equal or smaller than the start key of the current block. While actual keys can potentially be very long, this "fake key" or "virtual key" can be much shorter. For example, if the stop key of previous block is "the quick brown fox", the start key of current block is "the who", we could use "the r" as our virtual key in our hfile index. There are two benefits to this: -
having shorter keys reduces the hfile index size, (allowing us to keep more indexes in memory), and
-
using something closer to the end key of the previous block allows us to avoid a potential extra IO when the target key lives in between the "virtual key" and the key of the first element in the target block.
+ having shorter keys reduces the hfile index size, (allowing us to keep more indexes in memory), and + using something closer to the end key of the previous block allows us to avoid a potential extra IO when the target key lives in between the "virtual key" and the key of the first element in the target block.
This optimization (implemented by the getShortMidpointKey method) is inspired by LevelDB's ByteWiseComparatorImpl::FindShortestSeparator() and FindShortSuccessor().
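A toy illustration of the separator idea (this is not the actual getShortMidpointKey code, and it ignores edge cases such as one key being a prefix of the other):

// Find a short key k with lastKeyOfPrevBlock < k <= firstKeyOfCurrBlock.
static String shortSeparator(String lastKeyOfPrevBlock, String firstKeyOfCurrBlock) {
  int i = 0;
  int limit = Math.min(lastKeyOfPrevBlock.length(), firstKeyOfCurrBlock.length());
  while (i < limit && lastKeyOfPrevBlock.charAt(i) == firstKeyOfCurrBlock.charAt(i)) {
    i++;   // length of the shared prefix
  }
  // Keep the shared prefix and bump the first differing character of the previous key.
  return lastKeyOfPrevBlock.substring(0, i) + (char) (lastKeyOfPrevBlock.charAt(i) + 1);
}
// shortSeparator("the quick brown fox", "the who") returns "the r", matching the example above.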
@@ -3490,10 +3492,10 @@ Comparator class used for Bloom filter keys, a UTF>8 encoded string stored usi
HBase Videos Introduction to HBase - Introduction to HBase by Todd Lipcon (Chicago Data Summit 2011). - - Introduction to HBase by Todd Lipcon (2010). - + Introduction to HBase by Todd Lipcon (Chicago Data Summit 2011). + + Introduction to HBase by Todd Lipcon (2010). + Building Real Time Services at Facebook with HBase by Jonathan Gray (Hadoop World 2011). @@ -3520,8 +3522,8 @@ Comparator class used for Bloom filter keys, a UTF>8 encoded string stored usi
HBase Sites Cloudera's HBase Blog has a lot of links to useful HBase information. - CAP Confusion is a relevant entry for background information on - distributed storage systems. + CAP Confusion is a relevant entry for background information on + distributed storage systems. @@ -3543,14 +3545,14 @@ Comparator class used for Bloom filter keys, a UTF>8 encoded string stored usi HBase History - 2006: BigTable paper published by Google. - - 2006 (end of year): HBase development starts. - - 2008: HBase becomes Hadoop sub-project. - - 2010: HBase becomes Apache top-level project. - + 2006: BigTable paper published by Google. + + 2006 (end of year): HBase development starts. + + 2008: HBase becomes Hadoop sub-project. + + 2010: HBase becomes Apache top-level project. + diff --git a/src/main/docbkx/case_studies.xml b/src/main/docbkx/case_studies.xml index 067a8b59204..15169a8aa43 100644 --- a/src/main/docbkx/case_studies.xml +++ b/src/main/docbkx/case_studies.xml @@ -1,13 +1,13 @@ - Apache HBase Case Studies -
- Overview - This chapter will describe a variety of performance and troubleshooting case studies that can +
+ Overview + This chapter will describe a variety of performance and troubleshooting case studies that can provide a useful blueprint on diagnosing Apache HBase cluster issues. - For more information on Performance and Troubleshooting, see and . - -
- -
- Schema Design - See the schema design case studies here: - - -
- -
- Performance/Troubleshooting - + For more information on Performance and Troubleshooting, see and . + +
+ +
+ Schema Design + See the schema design case studies here: + + +
+ +
+ Performance/Troubleshooting +
Case Study #1 (Performance Issue On A Single Node)
Scenario Following a scheduled reboot, one data node began exhibiting unusual behavior. Routine MapReduce - jobs run against HBase tables which regularly completed in five or six minutes began taking 30 or 40 minutes - to finish. These jobs were consistently found to be waiting on map and reduce tasks assigned to the troubled data node - (e.g., the slow map tasks all had the same Input Split). - The situation came to a head during a distributed copy, when the copy was severely prolonged by the lagging node. - -
+ jobs run against HBase tables which regularly completed in five or six minutes began taking 30 or 40 minutes + to finish. These jobs were consistently found to be waiting on map and reduce tasks assigned to the troubled data node + (e.g., the slow map tasks all had the same Input Split). + The situation came to a head during a distributed copy, when the copy was severely prolonged by the lagging node. + +
Hardware Datanodes: - - Two 12-core processors - Six Enerprise SATA disks - 24GB of RAM - Two bonded gigabit NICs - + + Two 12-core processors + Six Enterprise SATA disks + 24GB of RAM + Two bonded gigabit NICs + Network: - - 10 Gigabit top-of-rack switches - 20 Gigabit bonded interconnects between racks. - + + 10 Gigabit top-of-rack switches + 20 Gigabit bonded interconnects between racks. +
Hypotheses -
HBase "Hot Spot" Region - We hypothesized that we were experiencing a familiar point of pain: a "hot spot" region in an HBase table, - where uneven key-space distribution can funnel a huge number of requests to a single HBase region, bombarding the RegionServer - process and cause slow response time. Examination of the HBase Master status page showed that the number of HBase requests to the - troubled node was almost zero. Further, examination of the HBase logs showed that there were no region splits, compactions, or other region transitions - in progress. This effectively ruled out a "hot spot" as the root cause of the observed slowness. +
HBase "Hot Spot" Region + We hypothesized that we were experiencing a familiar point of pain: a "hot spot" region in an HBase table, + where uneven key-space distribution can funnel a huge number of requests to a single HBase region, bombarding the RegionServer + process and cause slow response time. Examination of the HBase Master status page showed that the number of HBase requests to the + troubled node was almost zero. Further, examination of the HBase logs showed that there were no region splits, compactions, or other region transitions + in progress. This effectively ruled out a "hot spot" as the root cause of the observed slowness.
-
HBase Region With Non-Local Data - Our next hypothesis was that one of the MapReduce tasks was requesting data from HBase that was not local to the datanode, thus - forcing HDFS to request data blocks from other servers over the network. Examination of the datanode logs showed that there were very - few blocks being requested over the network, indicating that the HBase region was correctly assigned, and that the majority of the necessary - data was located on the node. This ruled out the possibility of non-local data causing a slowdown. +
HBase Region With Non-Local Data + Our next hypothesis was that one of the MapReduce tasks was requesting data from HBase that was not local to the datanode, thus + forcing HDFS to request data blocks from other servers over the network. Examination of the datanode logs showed that there were very + few blocks being requested over the network, indicating that the HBase region was correctly assigned, and that the majority of the necessary + data was located on the node. This ruled out the possibility of non-local data causing a slowdown.
-
Excessive I/O Wait Due To Swapping Or An Over-Worked Or Failing Hard Disk +
Excessive I/O Wait Due To Swapping Or An Over-Worked Or Failing Hard Disk After concluding that the Hadoop and HBase were not likely to be the culprits, we moved on to troubleshooting the datanode's hardware. - Java, by design, will periodically scan its entire memory space to do garbage collection. If system memory is heavily overcommitted, the Linux - kernel may enter a vicious cycle, using up all of its resources swapping Java heap back and forth from disk to RAM as Java tries to run garbage - collection. Further, a failing hard disk will often retry reads and/or writes many times before giving up and returning an error. This can manifest - as high iowait, as running processes wait for reads and writes to complete. Finally, a disk nearing the upper edge of its performance envelope will - begin to cause iowait as it informs the kernel that it cannot accept any more data, and the kernel queues incoming data into the dirty write pool in memory. - However, using vmstat(1) and free(1), we could see that no swap was being used, and the amount of disk IO was only a few kilobytes per second. + Java, by design, will periodically scan its entire memory space to do garbage collection. If system memory is heavily overcommitted, the Linux + kernel may enter a vicious cycle, using up all of its resources swapping Java heap back and forth from disk to RAM as Java tries to run garbage + collection. Further, a failing hard disk will often retry reads and/or writes many times before giving up and returning an error. This can manifest + as high iowait, as running processes wait for reads and writes to complete. Finally, a disk nearing the upper edge of its performance envelope will + begin to cause iowait as it informs the kernel that it cannot accept any more data, and the kernel queues incoming data into the dirty write pool in memory. + However, using vmstat(1) and free(1), we could see that no swap was being used, and the amount of disk IO was only a few kilobytes per second.
-
Slowness Due To High Processor Usage +
Slowness Due To High Processor Usage Next, we checked to see whether the system was performing slowly simply due to very high computational load. top(1) showed that the system load - was higher than normal, but vmstat(1) and mpstat(1) showed that the amount of processor being used for actual computation was low. + was higher than normal, but vmstat(1) and mpstat(1) showed that the amount of processor being used for actual computation was low.
-
Network Saturation (The Winner) +
Network Saturation (The Winner) Since neither the disks nor the processors were being utilized heavily, we moved on to the performance of the network interfaces. The datanode had two - gigabit ethernet adapters, bonded to form an active-standby interface. ifconfig(8) showed some unusual anomalies, namely interface errors, overruns, framing errors. - While not unheard of, these kinds of errors are exceedingly rare on modern hardware which is operating as it should: - + gigabit ethernet adapters, bonded to form an active-standby interface. ifconfig(8) showed some unusual anomalies, namely interface errors, overruns, framing errors. + While not unheard of, these kinds of errors are exceedingly rare on modern hardware which is operating as it should: + $ /sbin/ifconfig bond0 bond0 Link encap:Ethernet HWaddr 00:00:00:00:00:00 inet addr:10.x.x.x Bcast:10.x.x.255 Mask:255.255.255.0 @@ -118,9 +118,9 @@ RX bytes:2416328868676 (2.4 TB) TX bytes:3464991094001 (3.4 TB) These errors immediately lead us to suspect that one or more of the ethernet interfaces might have negotiated the wrong line speed. This was confirmed both by running an ICMP ping - from an external host and observing round-trip-time in excess of 700ms, and by running ethtool(8) on the members of the bond interface and discovering that the active interface - was operating at 100Mbs/, full duplex. - + from an external host and observing round-trip-time in excess of 700ms, and by running ethtool(8) on the members of the bond interface and discovering that the active interface + was operating at 100Mbs/, full duplex. + $ sudo ethtool eth0 Settings for eth0: Supported ports: [ TP ] @@ -148,44 +148,44 @@ Wake-on: g Current message level: 0x00000003 (3) Link detected: yes - - In normal operation, the ICMP ping round trip time should be around 20ms, and the interface speed and duplex should read, "1000MB/s", and, "Full", respectively. - -
-
-
Resolution - After determining that the active ethernet adapter was at the incorrect speed, we used the ifenslave(8) command to make the standby interface - the active interface, which yielded an immediate improvement in MapReduce performance, and a 10 times improvement in network throughput: - - On the next trip to the datacenter, we determined that the line speed issue was ultimately caused by a bad network cable, which was replaced. - -
-
+ + In normal operation, the ICMP ping round trip time should be around 20ms, and the interface speed and duplex should read, "1000MB/s", and, "Full", respectively. + +
+
+
Resolution
+          After determining that the active ethernet adapter was running at the incorrect speed, we used the ifenslave(8) command to make the standby interface
+          the active interface, which yielded an immediate improvement in MapReduce performance and a tenfold improvement in network throughput.
+          
+          On the next trip to the datacenter, we determined that the line speed issue was ultimately caused by a bad network cable, which was replaced.
+          
+
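As a rough sketch of the commands involved (the interface names bond0, eth0, and eth1 are illustrative assumptions, not taken from the case study), the negotiated speed of each bond member can be checked with ethtool(8), and the standby member promoted with ifenslave(8):

# Check the negotiated speed/duplex of each (assumed) bond member
$ sudo ethtool eth0 | grep -E 'Speed|Duplex'
$ sudo ethtool eth1 | grep -E 'Speed|Duplex'
# Promote the standby member to be the active slave of bond0
$ sudo ifenslave -c bond0 eth1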
+
Case Study #2 (Performance Research 2012) Investigation results of a self-described "we're not sure what's wrong, but it seems slow" problem. - http://gbif.blogspot.com/2012/03/hbase-performance-evaluation-continued.html + http://gbif.blogspot.com/2012/03/hbase-performance-evaluation-continued.html
- +
Case Study #3 (Performance Research 2010)
            Investigation results of general cluster performance from 2010. Although this research is on an older version of the codebase, this writeup
-            is still very useful in terms of approach.
-            http://hstack.org/hbase-performance-testing/
+          is still very useful in terms of approach.
+          http://hstack.org/hbase-performance-testing/
        
- +
Case Study #4 (xcievers Config) Case study of configuring xceivers, and diagnosing errors from mis-configurations. - http://www.larsgeorge.com/2012/03/hadoop-hbase-and-xceivers.html + http://www.larsgeorge.com/2012/03/hadoop-hbase-and-xceivers.html See also .
- -
- - + +
+ + diff --git a/src/main/docbkx/configuration.xml b/src/main/docbkx/configuration.xml index 45bc157742b..25e1f1376ad 100644 --- a/src/main/docbkx/configuration.xml +++ b/src/main/docbkx/configuration.xml @@ -173,7 +173,7 @@ needed for servers to pick up changes (caveat dynamic config. to be described la A useful read setting config on you hadoop cluster is Aaron Kimballs' Configuration + xlink:href="http://www.cloudera.com/blog/2009/03/configuration-parameters-what-can-you-just-ignore/">Configuration Parameters: What can you just ignore?
@@ -527,8 +527,7 @@ homed on the node h-24-30.example.com. Now skip to for how to start and verify your pseudo-distributed install. - See Pseudo-distributed - mode extras for notes on how to start extra Masters and + See for notes on how to start extra Masters and RegionServers when running pseudo-distributed. @@ -695,11 +694,7 @@ homed on the node h-24-30.example.com. bin/start-hbase.sh - Run the above from the - - HBASE_HOME - - directory. + Run the above from the HBASE_HOME directory. You should now have a running HBase instance. HBase logs can be found in the logs subdirectory. Check them out @@ -771,7 +766,79 @@ stopping hbase............... Shutdown can take a moment to The generated file is a docbook section with a glossary in it--> - + + +
+ + + This file is fallback content. If you are seeing this, something is wrong with the build of the HBase documentation or you are doing pre-build verification. + + + The file hbase-default.xml is generated as part of + the build of the hbase site. See the hbase pom.xml. + The generated file is a docbook glossary. + +
+ IDs that are auto-generated and cause validation errors if not present + + Each of these is a reference to a configuration file parameter which will cause an error if you are using the fallback content here. This is a dirty dirty hack. + +
+ fail.fast.expired.active.master + +
+
+ "hbase.hregion.memstore.flush.size" + +
+
+ hbase.hstore.bytes.per.checksum + +
+
+ hbase.online.schema.update.enable + +
+
+ hbase.regionserver.global.memstore.size + +
+
+ hbase.hregion.max.filesize + +
+
+ hbase.hstore.BlockingStoreFiles + +
+
+ hfile.block.cache.size + +
+
+ copy.table + +
+
+ hbase.hstore.checksum.algorithm + +
+
+ hbase.zookeeper.useMulti + +
+
+ hbase.hregion.memstore.block.multiplier + +
+
+ hbase.regionserver.global.memstore.size.lower.limit + +
+
+
+
+
diff --git a/src/main/docbkx/developer.xml b/src/main/docbkx/developer.xml index dd469b65d60..cedc6a5d399 100644 --- a/src/main/docbkx/developer.xml +++ b/src/main/docbkx/developer.xml @@ -118,8 +118,8 @@ git clone git://github.com/apache/hbase.git Maven Classpath Variable The M2_REPO classpath variable needs to be set up for the project. This needs to be set to your local Maven repository, which is usually ~/.m2/repository - If this classpath variable is not configured, you will see compile errors in Eclipse like this... - +If this classpath variable is not configured, you will see compile errors in Eclipse like this: + Description Resource Path Location Type The project cannot be built until build path errors are resolved hbase Unknown Java Problem Unbound classpath variable: 'M2_REPO/asm/asm/3.1/asm-3.1.jar' in project 'hbase' hbase Build path Build Path Problem @@ -223,51 +223,52 @@ mvn compile -Dcompile-protobuf -Dprotoc.path=/opt/local/bin/protoc poms when you build. For now, just be aware of the difference between HBase 1.x builds and those of HBase 0.96-0.98. Below we will come back to this difference when we list out build instructions. -
+ + Publishing to maven requires you sign the artifacts you want to upload. To have the build do this for you, you need to make sure you have a properly configured settings.xml in your local repository under .m2. Here is my ~/.m2/settings.xml. - <settings xmlns="http://maven.apache.org/SETTINGS/1.0.0" + - <servers> - <!- To publish a snapshot of some part of Maven --> - <server> - <id>apache.snapshots.https</id> - <username>YOUR_APACHE_ID - </username> - <password>YOUR_APACHE_PASSWORD - </password> - </server> - <!-- To publish a website using Maven --> - <!-- To stage a release of some part of Maven --> - <server> - <id>apache.releases.https</id> - <username>YOUR_APACHE_ID - </username> - <password>YOUR_APACHE_PASSWORD - </password> - </server> - </servers> - <profiles> - <profile> - <id>apache-release</id> - <properties> - <gpg.keyname>YOUR_KEYNAME</gpg.keyname> - <!--Keyname is something like this ... 00A5F21E... do gpg --list-keys to find it--> - <gpg.passphrase>YOUR_KEY_PASSWORD - </gpg.passphrase> - </properties> - </profile> - </profiles> -</settings> + + + + apache.snapshots.https + YOUR_APACHE_ID + + YOUR_APACHE_PASSWORD + + + + + + apache.releases.https + YOUR_APACHE_ID + + YOUR_APACHE_PASSWORD + + + + + + apache-release + + YOUR_KEYNAME + + YOUR_KEY_PASSWORD + + + + +]]> You must use maven 3.0.x (Check by running mvn -version). - +
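With a settings.xml like the one above in place, publishing a snapshot is usually just a signed deploy. The invocation below is a hedged sketch, not the authoritative release procedure:

$ mvn -version    # confirm you are on maven 3.0.x
$ mvn clean deploy -DskipTests -Papache-release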
Making a Release Candidate I'll explain by running through the process. See later in this section for more detail on particular steps. @@ -501,17 +502,17 @@ HBase have a character not usually seen in other projects. dependency tree).
Running Tests in other Modules - If the module you are developing in has no other dependencies on other HBase modules, then - you can cd into that module and just run: + If the module you are developing in has no other dependencies on other HBase modules, then + you can cd into that module and just run: mvn test - which will just run the tests IN THAT MODULE. If there are other dependencies on other modules, + which will just run the tests IN THAT MODULE. If there are other dependencies on other modules, then you will have run the command from the ROOT HBASE DIRECTORY. This will run the tests in the other modules, unless you specify to skip the tests in that module. For instance, to skip the tests in the hbase-server module, - you would run: + you would run: mvn clean test -PskipServerTests - from the top level directory to run all the tests in modules other than hbase-server. Note that you + from the top level directory to run all the tests in modules other than hbase-server. Note that you can specify to skip tests in multiple modules as well as just for a single module. For example, to skip - the tests in hbase-server and hbase-common, you would run: + the tests in hbase-server and hbase-common, you would run: mvn clean test -PskipServerTests -PskipCommonTests Also, keep in mind that if you are running tests in the hbase-server module you will need to apply the maven profiles discussed in to get the tests to run properly. @@ -541,7 +542,7 @@ The first three categories, small, medium, and large are for tests run when you type $ mvn test; i.e. these three categorizations are for HBase unit tests. The integration category is for not for unit tests but for integration tests. These are run when you invoke $ mvn verify. Integration tests -are described in integration tests section and will not be discussed further +are described in and will not be discussed further in this section on HBase unit tests. Apache HBase uses a patched maven surefire plugin and maven profiles to implement @@ -579,7 +580,7 @@ the developer machine as well.
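To run a single test class rather than a whole module, the standard surefire -Dtest property can be used as well; the class name below is purely illustrative:

$ cd hbase-server
$ mvn test -Dtest=TestExample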
Integration Tests<indexterm><primary>IntegrationTests</primary></indexterm> Integration tests are system level tests. See -integration tests section for more info. + for more info.
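In other words, where the unit test categories above run under mvn test, the integration category is exercised through the verify phase:

$ mvn verify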
@@ -704,17 +705,17 @@ should not impact these resources, it's worth checking these log lines General rules -As much as possible, tests should be written as category small tests. +As much as possible, tests should be written as category small tests. -All tests must be written to support parallel execution on the same machine, hence they should not use shared resources as fixed ports or fixed file names. +All tests must be written to support parallel execution on the same machine, hence they should not use shared resources as fixed ports or fixed file names. -Tests should not overlog. More than 100 lines/second makes the logs complex to read and use i/o that are hence not available for the other tests. +Tests should not overlog. More than 100 lines/second makes the logs complex to read and use i/o that are hence not available for the other tests. -Tests can be written with HBaseTestingUtility. -This class offers helper functions to create a temp directory and do the cleanup, or to start a cluster. +Tests can be written with HBaseTestingUtility. +This class offers helper functions to create a temp directory and do the cleanup, or to start a cluster.
@@ -722,19 +723,19 @@ This class offers helper functions to create a temp directory and do the cleanup Categories and execution time -All tests must be categorized, if not they could be skipped. +All tests must be categorized, if not they could be skipped. -All tests should be written to be as fast as possible. +All tests should be written to be as fast as possible. -Small category tests should last less than 15 seconds, and must not have any side effect. +Small category tests should last less than 15 seconds, and must not have any side effect. -Medium category tests should last less than 50 seconds. +Medium category tests should last less than 50 seconds. -Large category tests should last less than 3 minutes. This should ensure a good parallelization for people using it, and ease the analysis when the test fails. +Large category tests should last less than 3 minutes. This should ensure a good parallelization for people using it, and ease the analysis when the test fails.
@@ -862,17 +863,17 @@ are running other tests. -ChaosMonkey defines Action's and Policy's. Actions are sequences of events. We have at least the following actions: +ChaosMonkey defines Action's and Policy's. Actions are sequences of events. We have at least the following actions: -Restart active master (sleep 5 sec) -Restart random regionserver (sleep 5 sec) -Restart random regionserver (sleep 60 sec) -Restart META regionserver (sleep 5 sec) -Restart ROOT regionserver (sleep 5 sec) -Batch restart of 50% of regionservers (sleep 5 sec) -Rolling restart of 100% of regionservers (sleep 5 sec) +Restart active master (sleep 5 sec) +Restart random regionserver (sleep 5 sec) +Restart random regionserver (sleep 60 sec) +Restart META regionserver (sleep 5 sec) +Restart ROOT regionserver (sleep 5 sec) +Batch restart of 50% of regionservers (sleep 5 sec) +Rolling restart of 100% of regionservers (sleep 5 sec) - + Policies on the other hand are responsible for executing the actions based on a strategy. The default policy is to execute a random action every minute based on predefined action weights. ChaosMonkey executes predefined named policies until it is stopped. More than one @@ -881,11 +882,12 @@ policy can be active at any time. To run ChaosMonkey as a standalone tool deploy your HBase cluster as usual. ChaosMonkey uses the configuration -from the bin/hbase script, thus no extra configuration needs to be done. You can invoke the ChaosMonkey by running: +from the bin/hbase script, thus no extra configuration needs to be done. You can invoke the ChaosMonkey by running: bin/hbase org.apache.hadoop.hbase.util.ChaosMonkey - + This will output smt like: - + + 12/11/19 23:21:57 INFO util.ChaosMonkey: Using ChaosMonkey Policy: class org.apache.hadoop.hbase.util.ChaosMonkey$PeriodicRandomActionPolicy, period:60000 12/11/19 23:21:57 INFO util.ChaosMonkey: Sleeping for 26953 to add jitter 12/11/19 23:22:24 INFO util.ChaosMonkey: Performing action: Restart active master @@ -921,8 +923,8 @@ This will output smt like: 12/11/19 23:24:26 INFO hbase.ClusterManager: Executed remote command, exit code:0 , output:starting regionserver, logging to /homes/enis/code/hbase-0.94/bin/../logs/hbase-enis-regionserver-rs3.example.com.out 12/11/19 23:24:27 INFO util.ChaosMonkey: Started region server:rs3.example.com,60020,1353367027826. Reported num of rs:6 - - + + As you can see from the log, ChaosMonkey started the default PeriodicRandomActionPolicy, which is configured with all the available actions, and ran RestartActiveMaster and RestartRandomRs actions. ChaosMonkey tool, if run from command line, will keep on running until the process is killed.
@@ -958,7 +960,7 @@ mvn compile The above will build against whatever explicit hadoop 1.x version we have in our pom.xml as our '1.0' version. Tests may not all pass so you may need to pass -DskipTests unless you are inclined to fix the failing tests. - + 'dependencyManagement.dependencies.dependency.artifactId' for org.apache.hbase:${compat.module}:test-jar with value '${compat.module}' does not match a valid id pattern You will see ERRORs like the above title if you pass the default profile; e.g. if you pass hadoop.profile=1.1 when building 0.96 or @@ -1001,12 +1003,12 @@ pecularity that is probably fixable but we've not spent the time trying to figur
Jira Priorities The following is a guideline on setting Jira issue priorities: - Blocker: Should only be used if the issue WILL cause data loss or cluster instability reliably. - Critical: The issue described can cause data loss or cluster instability in some cases. - Major: Important but not tragic issues, like updates to the client API that will add a lot of much-needed functionality or significant - bugs that need to be fixed but that don't cause data loss. - Minor: Useful enhancements and annoying but not damaging bugs. - Trivial: Useful enhancements but generally cosmetic. + Blocker: Should only be used if the issue WILL cause data loss or cluster instability reliably. + Critical: The issue described can cause data loss or cluster instability in some cases. + Major: Important but not tragic issues, like updates to the client API that will add a lot of much-needed functionality or significant + bugs that need to be fixed but that don't cause data loss. + Minor: Useful enhancements and annoying but not damaging bugs. + Trivial: Useful enhancements but generally cosmetic.
@@ -1161,10 +1163,9 @@ pecularity that is probably fixable but we've not spent the time trying to figur Please submit one patch-file per Jira. For example, if multiple files are changed make sure the selected resource when generating the patch is a directory. Patch files can reflect changes in multiple files. - Generating patches using git: - -$ git diff --no-prefix > HBASE_XXXX.patch - + Generating patches using git: +$ git diff --no-prefix > HBASE_XXXX.patch + Don't forget the 'no-prefix' option; and generate the diff from the root directory of project Make sure you review for code style. @@ -1283,11 +1284,10 @@ Bar bar = foo.getBar(); <--- imagine there's an extra space(s) after the
Javadoc - This is also a very common feedback item. Don't forget Javadoc! + This is also a very common feedback item. Don't forget Javadoc! Javadoc warnings are checked during precommit. If the precommit tool gives you a '-1', please fix the javadoc issue. Your patch won't be committed if it adds such warnings. -
Findbugs @@ -1345,25 +1345,25 @@ Bar bar = foo.getBar(); <--- imagine there's an extra space(s) after the - Do not delete the old patch file + Do not delete the old patch file - version your new patch file using a simple scheme like this: - HBASE-{jira number}-{version}.patch - e.g: - HBASE_XXXX-v2.patch + version your new patch file using a simple scheme like this: + HBASE-{jira number}-{version}.patch + e.g: + HBASE_XXXX-v2.patch - 'Cancel Patch' on JIRA.. bug status will change back to Open + 'Cancel Patch' on JIRA.. bug status will change back to Open - Attach new patch file (e.g. HBASE_XXXX-v2.patch) using 'Files --> Attach' + Attach new patch file (e.g. HBASE_XXXX-v2.patch) using 'Files --> Attach' - Click on 'Submit Patch'. Now the bug status will say 'Patch Available'. + Click on 'Submit Patch'. Now the bug status will say 'Patch Available'. - Committers will review the patch. Rinse and repeat as many times as needed :-) + Committers will review the patch. Rinse and repeat as many times as needed :-)
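Concretely, regenerating and naming a second revision of a patch might look like the following (the issue number is a placeholder, as above):

$ git diff --no-prefix > HBASE-XXXX-v2.patch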
@@ -1372,32 +1372,32 @@ Bar bar = foo.getBar(); <--- imagine there's an extra space(s) after the At times you may want to break a big change into mulitple patches. Here is a sample work-flow using git - patch 1: + patch 1: - $ git diff --no-prefix > HBASE_XXXX-1.patch + $ git diff --no-prefix > HBASE_XXXX-1.patch - patch 2: + patch 2: - create a new git branch - $ git checkout -b my_branch + create a new git branch + $ git checkout -b my_branch - save your work - $ git add file1 file2 - $ git commit -am 'saved after HBASE_XXXX-1.patch' - now you have your own branch, that is different from remote master branch + save your work + $ git add file1 file2 + $ git commit -am 'saved after HBASE_XXXX-1.patch' + now you have your own branch, that is different from remote master branch - make more changes... + make more changes... - create second patch - $ git diff --no-prefix > HBASE_XXXX-2.patch + create second patch + $ git diff --no-prefix > HBASE_XXXX-2.patch diff --git a/src/main/docbkx/external_apis.xml b/src/main/docbkx/external_apis.xml index 9e3ed372798..8ad1c8bcfd2 100644 --- a/src/main/docbkx/external_apis.xml +++ b/src/main/docbkx/external_apis.xml @@ -27,8 +27,8 @@ */ --> Apache HBase External APIs - This chapter will cover access to Apache HBase either through non-Java languages, or through custom protocols. - + This chapter will cover access to Apache HBase either through non-Java languages, or through custom protocols. +
Non-Java Languages Talking to the JVM Currently the documentation on this topic in the @@ -172,7 +172,7 @@ Example4: =, 'substring:abc123' will match everything that begins with the substring "abc123"
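The same filter string grammar can also be exercised interactively from the HBase shell, which is a quick way to sanity-check an expression before embedding it in a client; the table name and row prefix below are only examples:

hbase> scan 'test', {FILTER => "PrefixFilter('row1') AND KeyOnlyFilter()"}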
-
Example PHP Client Program that uses the Filter Language +
Example PHP Client Program that uses the Filter Language <? $_SERVER['PHP_ROOT'] = realpath(dirname(__FILE__).'/..'); require_once $_SERVER['PHP_ROOT'].'/flib/__flib.php'; @@ -205,7 +205,7 @@ - + “(RowFilter (=, ‘binary:Row 1’) AND TimeStampsFilter (74689, 89734)) OR @@ -216,7 +216,7 @@ 1) The key-value pair must be in a column that is lexicographically >= abc and < xyz  - + @@ -228,7 +228,7 @@
-
Individual Filter Syntax +
Individual Filter Syntax KeyOnlyFilter diff --git a/src/main/docbkx/getting_started.xml b/src/main/docbkx/getting_started.xml index cd47284c6e3..c99adf8fbce 100644 --- a/src/main/docbkx/getting_started.xml +++ b/src/main/docbkx/getting_started.xml @@ -1,13 +1,13 @@ - Getting Started - +
Introduction - + will get you up and - running on a single-node, standalone instance of HBase. + running on a single-node, standalone instance of HBase.
- +
Quick Start - + This guide describes setup of a standalone HBase instance. It will - run against the local filesystem. In later sections we will take you through - how to run HBase on Apache Hadoop's HDFS, a distributed filesystem. This section - shows you how to create a table in HBase, inserting - rows into your new HBase table via the HBase shell, and then cleaning - up and shutting down your standalone, local filesystem-based HBase instance. The below exercise - should take no more than ten minutes (not including download time). + run against the local filesystem. In later sections we will take you through + how to run HBase on Apache Hadoop's HDFS, a distributed filesystem. This section + shows you how to create a table in HBase, inserting + rows into your new HBase table via the HBase shell, and then cleaning + up and shutting down your standalone, local filesystem-based HBase instance. The below exercise + should take no more than ten minutes (not including download time). Local Filesystem and Durability - Using HBase with a LocalFileSystem does not currently guarantee durability. + Using HBase with a LocalFileSystem does not currently guarantee durability. The HDFS local filesystem implementation will lose edits if files are not properly closed -- which is very likely to happen when experimenting with a new download. - You need to run HBase on HDFS to ensure all writes are preserved. Running - against the local filesystem though will get you off the ground quickly and get you - familiar with how the general system works so lets run with it for now. See - and its associated issues for more details. + You need to run HBase on HDFS to ensure all writes are preserved. Running + against the local filesystem though will get you off the ground quickly and get you + familiar with how the general system works so lets run with it for now. See + and its associated issues for more details. - Loopback IP - - The below advice is for hbase-0.94.x and older versions only. We believe this fixed in hbase-0.96.0 and beyond -(let us know if we have it wrong). There should be no need of the below modification to /etc/hosts in -later versions of HBase. - - HBase expects the loopback IP address to be 127.0.0.1. Ubuntu and some other distributions, - for example, will default to 127.0.1.1 and this will cause problems for you - See Why does HBase care about /etc/hosts? for detail.. - - /etc/hosts should look something like this: - + Loopback IP + The below advice is for hbase-0.94.x and older versions only. We believe this fixed in hbase-0.96.0 and beyond + (let us know if we have it wrong). There should be no need of the below modification to /etc/hosts in + later versions of HBase. + + HBase expects the loopback IP address to be 127.0.0.1. Ubuntu and some other distributions, + for example, will default to 127.0.1.1 and this will cause problems for you + See Why does HBase care about /etc/hosts? for detail.. + + /etc/hosts should look something like this: + 127.0.0.1 localhost 127.0.0.1 ubuntu.ubuntu-domain ubuntu - - - - + + + +
Download and unpack the latest stable release. - + Choose a download site from this list of Apache Download - Mirrors. Click on the suggested top link. This will take you to a - mirror of HBase Releases. Click on the folder named - stable and then download the file that ends in - .tar.gz to your local filesystem; e.g. - hbase-0.94.2.tar.gz. - + xlink:href="http://www.apache.org/dyn/closer.cgi/hbase/">Apache Download + Mirrors. Click on the suggested top link. This will take you to a + mirror of HBase Releases. Click on the folder named + stable and then download the file that ends in + .tar.gz to your local filesystem; e.g. + hbase-0.94.2.tar.gz. + Decompress and untar your download and then change into the - unpacked directory. - + unpacked directory. + $ tar xfz hbase-.tar.gz $ cd hbase- - + At this point, you are ready to start HBase. But before starting - it, edit conf/hbase-site.xml, the file you write - your site-specific configurations into. Set - hbase.rootdir, the directory HBase writes data to, - and hbase.zookeeper.property.dataDir, the directory - ZooKeeper writes its data too: -<?xml version="1.0"?> + it, edit conf/hbase-site.xml, the file you write + your site-specific configurations into. Set + hbase.rootdir, the directory HBase writes data to, + and hbase.zookeeper.property.dataDir, the directory + ZooKeeper writes its data too: + <?xml version="1.0"?> <?xml-stylesheet type="text/xsl" href="configuration.xsl"?> <configuration> <property> @@ -111,63 +110,63 @@ $ cd hbase- <value>/DIRECTORY/zookeeper</value> </property> </configuration> Replace DIRECTORY in the above with the - path to the directory you would have HBase and ZooKeeper write their data. By default, - hbase.rootdir is set to /tmp/hbase-${user.name} - and similarly so for the default ZooKeeper data location which means you'll lose all - your data whenever your server reboots unless you change it (Most operating systems clear - /tmp on restart). + path to the directory you would have HBase and ZooKeeper write their data. By default, + hbase.rootdir is set to /tmp/hbase-${user.name} + and similarly so for the default ZooKeeper data location which means you'll lose all + your data whenever your server reboots unless you change it (Most operating systems clear + /tmp on restart).
- +
Start HBase - + Now start HBase:$ ./bin/start-hbase.sh starting Master, logging to logs/hbase-user-master-example.org.out - + You should now have a running standalone HBase instance. In - standalone mode, HBase runs all daemons in the the one JVM; i.e. both - the HBase and ZooKeeper daemons. HBase logs can be found in the - logs subdirectory. Check them out especially if - it seems HBase had trouble starting. - + standalone mode, HBase runs all daemons in the the one JVM; i.e. both + the HBase and ZooKeeper daemons. HBase logs can be found in the + logs subdirectory. Check them out especially if + it seems HBase had trouble starting. + Is <application>java</application> installed? - + All of the above presumes a 1.6 version of Oracle - java is installed on your machine and - available on your path (See ); i.e. when you type - java, you see output that describes the - options the java program takes (HBase requires java 6). If this is not - the case, HBase will not start. Install java, edit - conf/hbase-env.sh, uncommenting the - JAVA_HOME line pointing it to your java install, then, - retry the steps above. + java is installed on your machine and + available on your path (See ); i.e. when you type + java, you see output that describes the + options the java program takes (HBase requires java 6). If this is not + the case, HBase will not start. Install java, edit + conf/hbase-env.sh, uncommenting the + JAVA_HOME line pointing it to your java install, then, + retry the steps above.
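A quick way to confirm that the master daemon actually came up is to look for the HMaster process with the JDK's jps tool (assuming jps is on your path):

$ jps | grep HMaster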
- +
Shell Exercises - + Connect to your running HBase via the shell. - + $ ./bin/hbase shell HBase Shell; enter 'help<RETURN>' for list of supported commands. Type "exit<RETURN>" to leave the HBase Shell Version: 0.90.0, r1001068, Fri Sep 24 13:55:42 PDT 2010 hbase(main):001:0> - + Type help and then - <RETURN> to see a listing of shell commands and - options. Browse at least the paragraphs at the end of the help emission - for the gist of how variables and command arguments are entered into the - HBase shell; in particular note how table names, rows, and columns, - etc., must be quoted. - - Create a table named test with a single column family named cf. - Verify its creation by listing all tables and then insert some - values. - + <RETURN> to see a listing of shell commands and + options. Browse at least the paragraphs at the end of the help emission + for the gist of how variables and command arguments are entered into the + HBase shell; in particular note how table names, rows, and columns, + etc., must be quoted. + + Create a table named test with a single column family named cf. + Verify its creation by listing all tables and then insert some + values. + hbase(main):003:0> create 'test', 'cf' 0 row(s) in 1.2200 seconds hbase(main):003:0> list 'test' @@ -179,59 +178,59 @@ hbase(main):005:0> put 'test', 'row2', 'cf:b', 'value2' 0 row(s) in 0.0370 seconds hbase(main):006:0> put 'test', 'row3', 'cf:c', 'value3' 0 row(s) in 0.0450 seconds - + Above we inserted 3 values, one at a time. The first insert is at - row1, column cf:a with a value of - value1. Columns in HBase are comprised of a column family prefix -- - cf in this example -- followed by a colon and then a - column qualifier suffix (a in this case). - + row1, column cf:a with a value of + value1. Columns in HBase are comprised of a column family prefix -- + cf in this example -- followed by a colon and then a + column qualifier suffix (a in this case). + Verify the data insert by running a scan of the table as follows - + hbase(main):007:0> scan 'test' ROW COLUMN+CELL row1 column=cf:a, timestamp=1288380727188, value=value1 row2 column=cf:b, timestamp=1288380738440, value=value2 row3 column=cf:c, timestamp=1288380747365, value=value3 3 row(s) in 0.0590 seconds - + Get a single row - + hbase(main):008:0> get 'test', 'row1' COLUMN CELL cf:a timestamp=1288380727188, value=value1 1 row(s) in 0.0400 seconds - + Now, disable and drop your table. This will clean up all done - above. - + above. + hbase(main):012:0> disable 'test' 0 row(s) in 1.0930 seconds hbase(main):013:0> drop 'test' 0 row(s) in 0.0770 seconds - + Exit the shell by typing exit. - + hbase(main):014:0> exit
- +
Stopping HBase - + Stop your hbase instance by running the stop script. - + $ ./bin/stop-hbase.sh stopping hbase...............
- +
Where to go next - + The above described standalone setup is good for testing and - experiments only. In the next chapter, , - we'll go into depth on the different HBase run modes, system requirements - running HBase, and critical configurations setting up a distributed HBase deploy. + experiments only. In the next chapter, , + we'll go into depth on the different HBase run modes, system requirements + running HBase, and critical configurations setting up a distributed HBase deploy.
- +
diff --git a/src/main/docbkx/ops_mgt.xml b/src/main/docbkx/ops_mgt.xml index dbd6d17bf37..7b2cd63298f 100644 --- a/src/main/docbkx/ops_mgt.xml +++ b/src/main/docbkx/ops_mgt.xml @@ -1,13 +1,9 @@ - - Apache HBase Operational Management - This chapter will cover operational tools and practices required of a running Apache HBase cluster. - The subject of operations is related to the topics of , , - and but is a distinct topic in itself. + This chapter will cover operational tools and practices required of a running Apache HBase + cluster. The subject of operations is related to the topics of , , and but is a distinct topic in + itself.
- HBase Tools and Utilities + HBase Tools and Utilities Here we list HBase tools for administration, analysis, fixup, and debugging. -
Canary -There is a Canary class can help users to canary-test the HBase cluster status, with every - column-family for every regions or regionservers granularity. To see the usage, - $ ${HBASE_HOME}/bin/hbase org.apache.hadoop.hbase.tool.Canary -help - Will output - Usage: bin/hbase org.apache.hadoop.hbase.tool.Canary [opts] [table1 [table2]...] | [regionserver1 [regionserver2]..] +
+ Canary + There is a Canary class can help users to canary-test the HBase cluster status, with + every column-family for every regions or regionservers granularity. To see the usage, use + the --help parameter. + $ ${HBASE_HOME}/bin/hbase org.apache.hadoop.hbase.tool.Canary -help + +Usage: bin/hbase org.apache.hadoop.hbase.tool.Canary [opts] [table1 [table2]...] | [regionserver1 [regionserver2]..] where [opts] are: -help Show this help and exit. -regionserver replace the table argument to regionserver, @@ -50,51 +49,54 @@ -e Use region/regionserver as regular expression which means the region/regionserver is regular expression pattern -f <B> stop whole program if first error occurs, default is true - -t <N> timeout for a check, default is 600000 (milliseconds) - This tool will return non zero error codes to user for collaborating with other monitoring - tools, such as Nagios. The error code definitions are... - private static final int USAGE_EXIT_CODE = 1; + -t <N> timeout for a check, default is 600000 (milliseconds) + This tool will return non zero error codes to user for collaborating with other + monitoring tools, such as Nagios. The error code definitions are: + private static final int USAGE_EXIT_CODE = 1; private static final int INIT_ERROR_EXIT_CODE = 2; private static final int TIMEOUT_ERROR_EXIT_CODE = 3; private static final int ERROR_EXIT_CODE = 4; - Here are some examples based on the following given case. There are two HTable called + Here are some examples based on the following given case. There are two HTable called test-01 and test-02, they have two column family cf1 and cf2 respectively, and deployed on - the 3 regionservers. see following table. - - - - - - - RegionServer - test-01 - test-02 - - - - - rs1 - r1 - r2 - - - rs2 - r2 - - - - rs3 - r2 - r1 - - - -
Following are some examples based on the previous given case.
-
Canary test for every column family (store) of every region of every table - -$ ${HBASE_HOME}/bin/hbase org.apache.hadoop.hbase.tool.Canary -The output log is... -13/12/09 03:26:32 INFO tool.Canary: read from region test-01,,1386230156732.0e3c7d77ffb6361ea1b996ac1042ca9a. column family cf1 in 2ms + the 3 regionservers. see following table. + + + + + + + + + RegionServer + test-01 + test-02 + + + + + rs1 + r1 + r2 + + + rs2 + r2 + + + + rs3 + r2 + r1 + + + + + Following are some examples based on the previous given case. +
+ Canary test for every column family (store) of every region of every table + $ ${HBASE_HOME}/bin/hbase org.apache.hadoop.hbase.tool.Canary + +3/12/09 03:26:32 INFO tool.Canary: read from region test-01,,1386230156732.0e3c7d77ffb6361ea1b996ac1042ca9a. column family cf1 in 2ms 13/12/09 03:26:32 INFO tool.Canary: read from region test-01,,1386230156732.0e3c7d77ffb6361ea1b996ac1042ca9a. column family cf2 in 2ms 13/12/09 03:26:32 INFO tool.Canary: read from region test-01,0004883,1386230156732.87b55e03dfeade00f441125159f8ca87. column family cf1 in 4ms 13/12/09 03:26:32 INFO tool.Canary: read from region test-01,0004883,1386230156732.87b55e03dfeade00f441125159f8ca87. column family cf2 in 1ms @@ -104,64 +106,70 @@ The output log is... 13/12/09 03:26:32 INFO tool.Canary: read from region test-02,0004883,1386559511167.cbda32d5e2e276520712d84eaaa29d84. column family cf1 in 31ms 13/12/09 03:26:32 INFO tool.Canary: read from region test-02,0004883,1386559511167.cbda32d5e2e276520712d84eaaa29d84. column family cf2 in 8ms -So you can see, table test-01 has two regions and two column families, so the Canary tool will pick 4 small piece of data from 4 (2 region * 2 store) different stores. This is a default behavior of the this tool does. - -
+ So you can see, table test-01 has two regions and two column families, so the Canary + tool will pick 4 small piece of data from 4 (2 region * 2 store) different stores. This is + a default behavior of the this tool does. +
-
Canary test for every column family (store) of every region of specific table(s) - -You can also test one or more specific tables. -$ ${HBASE_HOME}/bin/hbase orghapache.hadoop.hbase.tool.Canary test-01 test-02 - -
+
+ Canary test for every column family (store) of every region of specific + table(s) + You can also test one or more specific tables. + $ ${HBASE_HOME}/bin/hbase orghapache.hadoop.hbase.tool.Canary test-01 test-02 +
-
Canary test with regionserver granularity - -This will pick one small piece of data from each regionserver, and can also put your resionserver name as input options for canary-test specific regionservers. -$ ${HBASE_HOME}/bin/hbase org.apache.hadoop.hbase.tool.Canary -regionserver -The output log is... -13/12/09 06:05:17 INFO tool.Canary: Read from table:test-01 on region server:rs2 in 72ms +
+ Canary test with regionserver granularity + This will pick one small piece of data from each regionserver, and can also put your + resionserver name as input options for canary-test specific regionservers. + $ ${HBASE_HOME}/bin/hbase org.apache.hadoop.hbase.tool.Canary -regionserver + +13/12/09 06:05:17 INFO tool.Canary: Read from table:test-01 on region server:rs2 in 72ms 13/12/09 06:05:17 INFO tool.Canary: Read from table:test-02 on region server:rs3 in 34ms 13/12/09 06:05:17 INFO tool.Canary: Read from table:test-01 on region server:rs1 in 56ms - -
-
Canary test with regular expression pattern - -This will test both table test-01 and test-02. -$ ${HBASE_HOME}/bin/hbase orghapache.hadoop.hbase.tool.Canary -e test-0[1-2] - -
+
+
+ Canary test with regular expression pattern + This will test both table test-01 and test-02. + $ ${HBASE_HOME}/bin/hbase orghapache.hadoop.hbase.tool.Canary -e test-0[1-2] +
-
Run canary test as daemon mode - -Run repeatedly with interval defined in option -interval whose default value is 6 seconds. This daemon will stop itself and return non-zero error code if any error occurs, due to the default value of option -f is true. -$ ${HBASE_HOME}/bin/hbase orghapache.hadoop.hbase.tool.Canary -daemon -Run repeatedly with internal 5 seconds and will not stop itself even error occurs in the test. -$ ${HBASE_HOME}/bin/hbase orghapache.hadoop.hbase.tool.Canary -daemon -interval 50000 -f false - -
+
+ Run canary test as daemon mode + Run repeatedly with interval defined in option -interval whose default value is 6 + seconds. This daemon will stop itself and return non-zero error code if any error occurs, + due to the default value of option -f is true. + $ ${HBASE_HOME}/bin/hbase orghapache.hadoop.hbase.tool.Canary -daemon + Run repeatedly with internal 5 seconds and will not stop itself even error occurs in + the test. + $ ${HBASE_HOME}/bin/hbase orghapache.hadoop.hbase.tool.Canary -daemon -interval 50000 -f false +
-
Force timeout if canary test stuck -In some cases, we suffered the request stucked on the regionserver and not response back to the client. The regionserver in problem, would also not indicated to be dead by Master, which would bring the clients hung. So we provide the timeout option to kill the canary test forcefully and return non-zero error code as well. -This run sets the timeout value to 60 seconds, the default value is 600 seconds. -$ ${HBASE_HOME}/bin/hbase orghapache.hadoop.hbase.tool.Canary -t 600000 - -
+
+ Force timeout if canary test stuck + In some cases, we suffered the request stucked on the regionserver and not response + back to the client. The regionserver in problem, would also not indicated to be dead by + Master, which would bring the clients hung. So we provide the timeout option to kill the + canary test forcefully and return non-zero error code as well. This run sets the timeout + value to 60 seconds, the default value is 600 seconds. + $ ${HBASE_HOME}/bin/hbase orghapache.hadoop.hbase.tool.Canary -t 600000 +
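As a hedged illustration of how the exit codes listed earlier can be consumed by a monitoring system, a wrapper script might simply map a non-zero return code into an alert (the alerting command is a placeholder):

#!/bin/sh
# Hypothetical monitoring wrapper around the Canary tool
${HBASE_HOME}/bin/hbase org.apache.hadoop.hbase.tool.Canary -t 60000 test-01
rc=$?
if [ $rc -ne 0 ]; then
  echo "HBase canary failed with exit code $rc" | your-alerting-command
fi
exit $rc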
-
Health Checker - You can configure HBase to run a script on a period and if it fails N times (configurable), have the server exit. - See HBASE-7351 Periodic health check script for configurations and detail. - +
+ Health Checker + You can configure HBase to run a script on a period and if it fails N times + (configurable), have the server exit. See HBASE-7351 Periodic health + check script for configurations and detail.
-
Driver - There is a Driver class that is executed by the HBase jar can be used to invoke frequently accessed utilities. For example, -HADOOP_CLASSPATH=`${HBASE_HOME}/bin/hbase classpath` ${HADOOP_HOME}/bin/hadoop jar ${HBASE_HOME}/hbase-VERSION.jar - -... will return... - +
+ Driver + There is a Driver class that is executed by the HBase jar can be used to + invoke frequently accessed utilities. For example, + HADOOP_CLASSPATH=`${HBASE_HOME}/bin/hbase classpath` ${HADOOP_HOME}/bin/hadoop jar ${HBASE_HOME}/hbase-VERSION.jar + An example program must be given as the first argument. Valid program names are: completebulkload: Complete a bulk data load. @@ -172,28 +180,23 @@ Valid program names are: rowcounter: Count rows in HBase table verifyrep: Compare the data from tables in two different clusters. WARNING: It doesn't work for incrementColumnValues'd cells since the timestamp is chan -... for allowable program names. -
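For instance, one of the valid program names listed by the driver (such as rowcounter) can be run like this; the table name is illustrative:

$ HADOOP_CLASSPATH=`${HBASE_HOME}/bin/hbase classpath` ${HADOOP_HOME}/bin/hadoop jar ${HBASE_HOME}/hbase-VERSION.jar rowcounter myTable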
- HBase <application>hbck</application> - An fsck for your HBase install - To run hbck against your HBase cluster run - $ ./bin/hbase hbck - At the end of the commands output it prints OK - or INCONSISTENCY. If your cluster reports - inconsistencies, pass -details to see more detail emitted. - If inconsistencies, run hbck a few times because the - inconsistency may be transient (e.g. cluster is starting up or a region is - splitting). - Passing -fix may correct the inconsistency (This latter - is an experimental feature). - - For more information, see . - + HBase <application>hbck</application> + An fsck for your HBase install + To run hbck against your HBase cluster run $ + ./bin/hbase hbck At the end of the command's output it prints + OK or INCONSISTENCY. If your cluster reports + inconsistencies, pass -details to see more detail emitted. If + inconsistencies, run hbck a few times because the inconsistency may be + transient (e.g. cluster is starting up or a region is splitting). Passing + -fix may correct the inconsistency (This latter is an experimental + feature). + For more information, see .
-
HFile Tool - See . +
+ HFile Tool + See .
WAL Tools @@ -201,109 +204,132 @@ Valid program names are:
<classname>FSHLog</classname> tool - The main method on FSHLog offers manual - split and dump facilities. Pass it WALs or the product of a split, the - content of the recovered.edits. directory. + The main method on FSHLog offers manual split and dump + facilities. Pass it WALs or the product of a split, the content of the + recovered.edits. directory. You can get a textual dump of a WAL file content by doing the - following: $ ./bin/hbase org.apache.hadoop.hbase.regionserver.wal.FSHLog --dump hdfs://example.org:8020/hbase/.logs/example.org,60020,1283516293161/10.10.21.10%3A60020.1283973724012 The - return code will be non-zero if issues with the file so you can test - wholesomeness of file by redirecting STDOUT to - /dev/null and testing the program return. + following: $ ./bin/hbase org.apache.hadoop.hbase.regionserver.wal.FSHLog --dump hdfs://example.org:8020/hbase/.logs/example.org,60020,1283516293161/10.10.21.10%3A60020.1283973724012 The + return code will be non-zero if issues with the file so you can test wholesomeness of file + by redirecting STDOUT to /dev/null and testing the program + return. Similarly you can force a split of a log file directory by - doing: $ ./bin/hbase org.apache.hadoop.hbase.regionserver.wal.FSHLog --split hdfs://example.org:8020/hbase/.logs/example.org,60020,1283516293161/ + doing: $ ./bin/hbase org.apache.hadoop.hbase.regionserver.wal.FSHLog --split hdfs://example.org:8020/hbase/.logs/example.org,60020,1283516293161/
<classname>HLogPrettyPrinter</classname> - HLogPrettyPrinter is a tool with configurable options to print the contents of an HLog. - + HLogPrettyPrinter is a tool with configurable options to + print the contents of an HLog.
-
Compression Tool - See . +
+ Compression Tool + See .
-
- CopyTable - - CopyTable is a utility that can copy part or of all of a table, either to the same cluster or another cluster. The target table must - first exist. The usage is as follows: -$ bin/hbase org.apache.hadoop.hbase.mapreduce.CopyTable [--starttime=X] [--endtime=Y] [--new.name=NEW] [--peer.adr=ADR] tablename +
+ CopyTable + CopyTable is a utility that can copy part or of all of a table, either to the same + cluster or another cluster. The target table must first exist. The usage is as + follows: + $ bin/hbase org.apache.hadoop.hbase.mapreduce.CopyTable [--starttime=X] [--endtime=Y] [--new.name=NEW] [--peer.adr=ADR] tablename - - - Options: - - starttime Beginning of the time range. Without endtime means starttime to forever. - endtime End of the time range. Without endtime means starttime to forever. - versions Number of cell versions to copy. - new.name New table's name. - peer.adr Address of the peer cluster given in the format hbase.zookeeper.quorum:hbase.zookeeper.client.port:zookeeper.znode.parent - families Comma-separated list of ColumnFamilies to copy. - all.cells Also copy delete markers and uncollected deleted cells (advanced option). - - Args: - - tablename Name of table to copy. - - - Example of copying 'TestTable' to a cluster that uses replication for a 1 hour window: -$ bin/hbase org.apache.hadoop.hbase.mapreduce.CopyTable + + + Options + + starttime Beginning of the time range. Without endtime means + starttime to forever. + + + endtime End of the time range. Without endtime means starttime to + forever. + + + versions Number of cell versions to copy. + + + new.name New table's name. + + + peer.adr Address of the peer cluster given in the format + hbase.zookeeper.quorum:hbase.zookeeper.client.port:zookeeper.znode.parent + + + families Comma-separated list of ColumnFamilies to copy. + + + all.cells Also copy delete markers and uncollected deleted cells + (advanced option). + + + + Args: + + tablename Name of table to copy. + + + Example of copying 'TestTable' to a cluster that uses replication for a 1 hour + window: + $ bin/hbase org.apache.hadoop.hbase.mapreduce.CopyTable --starttime=1265875194289 --endtime=1265878794289 --peer.adr=server1,server2,server3:2181:/hbase TestTable - - Scanner Caching - Caching for the input Scan is configured via hbase.client.scanner.caching in the job configuration. - - - Versions - By default, CopyTable utility only copies the latest version of row cells unless --versions=n is explicitly specified in the command. - - - - See Jonathan Hsieh's Online HBase Backups with CopyTable blog post for more on CopyTable. - + + Scanner Caching + Caching for the input Scan is configured via hbase.client.scanner.caching + in the job configuration. + + + Versions + By default, CopyTable utility only copies the latest version of row cells unless + --versions=n is explicitly specified in the command. + + See Jonathan Hsieh's Online HBase Backups with CopyTable blog post for more on + CopyTable.
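As another example building on the options above, copying a single column family of TestTable into a new table on the same cluster might look like this (the new table name and family are illustrative):

$ bin/hbase org.apache.hadoop.hbase.mapreduce.CopyTable --new.name=TestTableCopy --families=cf1 TestTable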
- Export - Export is a utility that will dump the contents of table to HDFS in a sequence file. Invoke via: -$ bin/hbase org.apache.hadoop.hbase.mapreduce.Export <tablename> <outputdir> [<versions> [<starttime> [<endtime>]]] + Export + Export is a utility that will dump the contents of table to HDFS in a sequence file. + Invoke via: + $ bin/hbase org.apache.hadoop.hbase.mapreduce.Export <tablename> <outputdir> [<versions> [<starttime> [<endtime>]]] - - Note: caching for the input Scan is configured via hbase.client.scanner.caching in the job configuration. - + + Note: caching for the input Scan is configured via + hbase.client.scanner.caching in the job configuration.
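For example, dumping up to three versions of every cell of a (hypothetical) table MyTable into an HDFS directory would look like:

$ bin/hbase org.apache.hadoop.hbase.mapreduce.Export MyTable /export/MyTable 3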
- Import - Import is a utility that will load data that has been exported back into HBase. Invoke via: -$ bin/hbase org.apache.hadoop.hbase.mapreduce.Import <tablename> <inputdir> + Import + Import is a utility that will load data that has been exported back into HBase. Invoke + via: + $ bin/hbase org.apache.hadoop.hbase.mapreduce.Import <tablename> <inputdir> - - To import 0.94 exported files in a 0.96 cluster or onwards, you need to set system property "hbase.import.version" when running the import command as below: -$ bin/hbase -Dhbase.import.version=0.94 org.apache.hadoop.hbase.mapreduce.Import <tablename> <inputdir> + To import 0.94 exported files in a 0.96 cluster or onwards, you need to set system + property "hbase.import.version" when running the import command as below: + $ bin/hbase -Dhbase.import.version=0.94 org.apache.hadoop.hbase.mapreduce.Import <tablename> <inputdir> -
- ImportTsv - ImportTsv is a utility that will load data in TSV format into HBase. It has two distinct usages: loading data from TSV format in HDFS - into HBase via Puts, and preparing StoreFiles to be loaded via the completebulkload. - - To load data via Puts (i.e., non-bulk loading): -$ bin/hbase org.apache.hadoop.hbase.mapreduce.ImportTsv -Dimporttsv.columns=a,b,c <tablename> <hdfs-inputdir> + ImportTsv + ImportTsv is a utility that will load data in TSV format into HBase. It has two distinct + usages: loading data from TSV format in HDFS into HBase via Puts, and preparing StoreFiles + to be loaded via the completebulkload. + To load data via Puts (i.e., non-bulk loading): + $ bin/hbase org.apache.hadoop.hbase.mapreduce.ImportTsv -Dimporttsv.columns=a,b,c <tablename> <hdfs-inputdir> - - To generate StoreFiles for bulk-loading: -$ bin/hbase org.apache.hadoop.hbase.mapreduce.ImportTsv -Dimporttsv.columns=a,b,c -Dimporttsv.bulk.output=hdfs://storefile-outputdir <tablename> <hdfs-data-inputdir> + + To generate StoreFiles for bulk-loading: + $ bin/hbase org.apache.hadoop.hbase.mapreduce.ImportTsv -Dimporttsv.columns=a,b,c -Dimporttsv.bulk.output=hdfs://storefile-outputdir <tablename> <hdfs-data-inputdir> - - These generated StoreFiles can be loaded into HBase via . - -
ImportTsv Options - Running ImportTsv with no arguments prints brief usage information: - + These generated StoreFiles can be loaded into HBase via . +
+ ImportTsv Options + Running ImportTsv with no arguments prints brief usage information: + Usage: importtsv -Dimporttsv.columns=a,b,c <tablename> <inputdir> Imports the given input directory of TSV data into the specified table. @@ -327,12 +353,13 @@ Other options that may be specified with -D include: -Dimporttsv.timestamp=currentTimeAsLong - use the specified timestamp for the import -Dimporttsv.mapper.class=my.Mapper - A user-defined Mapper to use instead of org.apache.hadoop.hbase.mapreduce.TsvImporterMapper -
-
ImportTsv Example - For example, assume that we are loading data into a table called 'datatsv' with a ColumnFamily called 'd' with two columns "c1" and "c2". - - Assume that an input file exists as follows: - +
+
+ ImportTsv Example + For example, assume that we are loading data into a table called 'datatsv' with a + ColumnFamily called 'd' with two columns "c1" and "c2". + Assume that an input file exists as follows: + row1 c1 c2 row2 c1 c2 row3 c1 c2 @@ -344,171 +371,187 @@ row8 c1 c2 row9 c1 c2 row10 c1 c2 - - For ImportTsv to use this imput file, the command line needs to look like this: - + + For ImportTsv to use this imput file, the command line needs to look like this: + HADOOP_CLASSPATH=`${HBASE_HOME}/bin/hbase classpath` ${HADOOP_HOME}/bin/hadoop jar ${HBASE_HOME}/hbase-VERSION.jar importtsv -Dimporttsv.columns=HBASE_ROW_KEY,d:c1,d:c2 -Dimporttsv.bulk.output=hdfs://storefileoutput datatsv hdfs://inputfile - ... and in this example the first column is the rowkey, which is why the HBASE_ROW_KEY is used. The second and third columns in the file will be imported as "d:c1" and "d:c2", respectively. - -
-
ImportTsv Warning - If you have preparing a lot of data for bulk loading, make sure the target HBase table is pre-split appropriately. - -
-
See Also - For more information about bulk-loading HFiles into HBase, see -
+ ... and in this example the first column is the rowkey, which is why the + HBASE_ROW_KEY is used. The second and third columns in the file will be imported as "d:c1" + and "d:c2", respectively. +
+
+ ImportTsv Warning + If you have preparing a lot of data for bulk loading, make sure the target HBase table + is pre-split appropriately. +
+
+ See Also + For more information about bulk-loading HFiles into HBase, see +
- CompleteBulkLoad - The completebulkload utility will move generated StoreFiles into an HBase table. This utility is often used - in conjunction with output from . - - There are two ways to invoke this utility, with explicit classname and via the driver: -$ bin/hbase org.apache.hadoop.hbase.mapreduce.LoadIncrementalHFiles <hdfs://storefileoutput> <tablename> + CompleteBulkLoad + The completebulkload utility will move generated StoreFiles into an HBase + table. This utility is often used in conjunction with output from . + There are two ways to invoke this utility, with explicit classname and via the + driver: + $ bin/hbase org.apache.hadoop.hbase.mapreduce.LoadIncrementalHFiles <hdfs://storefileoutput> <tablename> -.. and via the Driver.. -HADOOP_CLASSPATH=`${HBASE_HOME}/bin/hbase classpath` ${HADOOP_HOME}/bin/hadoop jar ${HBASE_HOME}/hbase-VERSION.jar completebulkload <hdfs://storefileoutput> <tablename> + .. and via the Driver.. + HADOOP_CLASSPATH=`${HBASE_HOME}/bin/hbase classpath` ${HADOOP_HOME}/bin/hadoop jar ${HBASE_HOME}/hbase-VERSION.jar completebulkload <hdfs://storefileoutput> <tablename> - -
CompleteBulkLoad Warning - Data generated via MapReduce is often created with file permissions that are not compatible with the running HBase process. Assuming you're running HDFS with permissions enabled, those permissions will need to be updated before you run CompleteBulkLoad. - -
- For more information about bulk-loading HFiles into HBase, see . - +
+ CompleteBulkLoad Warning + Data generated via MapReduce is often created with file permissions that are not + compatible with the running HBase process. Assuming you're running HDFS with permissions + enabled, those permissions will need to be updated before you run CompleteBulkLoad. + For more information about bulk-loading HFiles into HBase, see . +
+
- WALPlayer - WALPlayer is a utility to replay WAL files into HBase. - - The WAL can be replayed for a set of tables or all tables, and a - timerange can be provided (in milliseconds). The WAL is filtered to - this set of tables. The output can optionally be mapped to another set of tables. - - WALPlayer can also generate HFiles for later bulk importing, in that case - only a single table and no mapping can be specified. - - Invoke via: -$ bin/hbase org.apache.hadoop.hbase.mapreduce.WALPlayer [options] <wal inputdir> <tables> [<tableMappings>]> + WALPlayer + WALPlayer is a utility to replay WAL files into HBase. + The WAL can be replayed for a set of tables or all tables, and a timerange can be + provided (in milliseconds). The WAL is filtered to this set of tables. The output can + optionally be mapped to another set of tables. + WALPlayer can also generate HFiles for later bulk importing, in that case only a single + table and no mapping can be specified. + Invoke via: + $ bin/hbase org.apache.hadoop.hbase.mapreduce.WALPlayer [options] <wal inputdir> <tables> [<tableMappings>]> - - For example: -$ bin/hbase org.apache.hadoop.hbase.mapreduce.WALPlayer /backuplogdir oldTable1,oldTable2 newTable1,newTable2 + For example: + $ bin/hbase org.apache.hadoop.hbase.mapreduce.WALPlayer /backuplogdir oldTable1,oldTable2 newTable1,newTable2 - - - WALPlayer, by default, runs as a mapreduce job. To NOT run WALPlayer as a mapreduce job on your cluster, - force it to run all in the local process by adding the flags -Dmapreduce.jobtracker.address=local on the command line. - + WALPlayer, by default, runs as a mapreduce job. To NOT run WALPlayer as a mapreduce job + on your cluster, force it to run all in the local process by adding the flags + -Dmapreduce.jobtracker.address=local on the command line.
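Putting that local-mode flag together with the invocation above gives, for example (flag placement assumes the usual ToolRunner-style argument parsing, so treat this as a sketch):

$ bin/hbase org.apache.hadoop.hbase.mapreduce.WALPlayer -Dmapreduce.jobtracker.address=local /backuplogdir oldTable1,oldTable2 newTable1,newTable2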
- RowCounter and CellCounter
- RowCounter is a
- mapreduce job to count all the rows of a table. This is a good utility to use as a sanity check to ensure that HBase can read
- all the blocks of a table if there are any concerns of metadata inconsistency. It will run the mapreduce all in a single
- process but it will run faster if you have a MapReduce cluster in place for it to exploit.
-$ bin/hbase org.apache.hadoop.hbase.mapreduce.RowCounter <tablename> [<column1> <column2>...]
+ RowCounter and CellCounter
+ RowCounter is a mapreduce job to count all the rows of a table. This is a good
+ utility to use as a sanity check to ensure that HBase can read all the blocks of a table if
+ there are any concerns of metadata inconsistency. It will run the mapreduce all in a single
+ process but it will run faster if you have a MapReduce cluster in place for it to
+ exploit.
+ $ bin/hbase org.apache.hadoop.hbase.mapreduce.RowCounter <tablename> [<column1> <column2>...]
 
- Note: caching for the input Scan is configured via hbase.client.scanner.caching in the job configuration.
- HBase ships another diagnostic mapreduce job called
- CellCounter. Like
- RowCounter, it gathers more fine-grained statistics about your table. The statistics gathered by RowCounter are more fine-grained
- and include:
- Total number of rows in the table.
- Total number of CFs across all rows.
- Total qualifiers across all rows.
- Total occurrence of each CF.
- Total occurrence of each qualifier.
- Total number of versions of each qualifier.
- The program allows you to limit the scope of the run. Provide a row regex or prefix to limit the rows to analyze. Use
- hbase.mapreduce.scan.column.family to specify scanning a single column family.
- $ bin/hbase org.apache.hadoop.hbase.mapreduce.CellCounter <tablename> <outputDir> [regex or prefix]
- Note: just like RowCounter, caching for the input Scan is configured via hbase.client.scanner.caching in the
- job configuration.
+ Note: caching for the input Scan is configured via
+ hbase.client.scanner.caching in the job configuration.
+ HBase ships another diagnostic mapreduce job called CellCounter. Like RowCounter, it is a
+ utility for gathering statistics about your table, but the statistics gathered by
+ CellCounter are more fine-grained and include:
+ 
+ Total number of rows in the table.
+ 
+ Total number of CFs across all rows.
+ 
+ Total qualifiers across all rows.
+ 
+ Total occurrence of each CF.
+ 
+ Total occurrence of each qualifier.
+ 
+ Total number of versions of each qualifier.
+ 
+ The program allows you to limit the scope of the run. Provide a row regex or prefix to
+ limit the rows to analyze. Use hbase.mapreduce.scan.column.family to specify
+ scanning a single column family.
+ $ bin/hbase org.apache.hadoop.hbase.mapreduce.CellCounter <tablename> <outputDir> [regex or prefix]
+ Note: just like RowCounter, caching for the input Scan is configured via
+ hbase.client.scanner.caching in the job configuration.
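+ As a sketch, the scan caching mentioned above can be supplied on the command line as a
+ Hadoop property, assuming the job accepts generic -D options as the MapReduce tools shipped
+ with HBase generally do; the value 500 is only illustrative:
+ $ bin/hbase org.apache.hadoop.hbase.mapreduce.RowCounter -Dhbase.client.scanner.caching=500 <tablename>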
- mlockall - It is possible to optionally pin your servers in physical memory making them less likely - to be swapped out in oversubscribed environments by having the servers call - mlockall on startup. - See HBASE-4391 Add ability to start RS as root and call mlockall - for how to build the optional library and have it run on startup. - + mlockall + It is possible to optionally pin your servers in physical memory making them less likely + to be swapped out in oversubscribed environments by having the servers call mlockall on startup. See HBASE-4391 Add ability to + start RS as root and call mlockall for how to build the optional library and have + it run on startup.
- Offline Compaction Tool - See the usage for the Compaction Tool. - Run it like this ./bin/hbase org.apache.hadoop.hbase.regionserver.CompactionTool - + Offline Compaction Tool + See the usage for the Compaction Tool. Run it like this ./bin/hbase + org.apache.hadoop.hbase.regionserver.CompactionTool +
-
+
+
Region Management
Major Compaction - Major compactions can be requested via the HBase shell or HBaseAdmin.majorCompact. - - Note: major compactions do NOT do region merges. See for more information about compactions. - - + Major compactions can be requested via the HBase shell or HBaseAdmin.majorCompact. + Note: major compactions do NOT do region merges. See for + more information about compactions.
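+ As a quick illustration from the shell (the table name is hypothetical; a fully-qualified
+ region name may be passed instead of a table name to compact a single region):
+ $ ./bin/hbase shell
+ hbase> major_compact 'myTable'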
Merge
- Merge is a utility that can merge adjoining regions in the same table (see org.apache.hadoop.hbase.util.Merge).
-$ bin/hbase org.apache.hadoop.hbase.util.Merge <tablename> <region1> <region2>
+ Merge is a utility that can merge adjoining regions in the same table (see
+ org.apache.hadoop.hbase.util.Merge).
+ $ bin/hbase org.apache.hadoop.hbase.util.Merge <tablename> <region1> <region2>
 
- If you feel you have too many regions and want to consolidate them, Merge is the utility you need. Merge must
- run be done when the cluster is down.
- See the O'Reilly HBase Book for
- an example of usage.
- You will need to pass 3 parameters to this application. The first one is the table name. The second one is the fully
- qualified name of the first region to merge, like "table_name,\x0A,1342956111995.7cef47f192318ba7ccc75b1bbf27a82b.". The third one
- is the fully qualified name for the second region to merge.
- Additionally, there is a Ruby script attached to HBASE-1621
- for region merging.
+ If you feel you have too many regions and want to consolidate them, Merge is the utility
+ you need. Merge must be run when the cluster is down. See the O'Reilly HBase
+ Book for an example of usage.
+ You will need to pass 3 parameters to this application. The first one is the table name.
+ The second one is the fully qualified name of the first region to merge, like
+ "table_name,\x0A,1342956111995.7cef47f192318ba7ccc75b1bbf27a82b.". The third one is the
+ fully qualified name for the second region to merge.
+ Additionally, there is a Ruby script attached to HBASE-1621 for region
+ merging.
-
Node Management -
Node Decommission - You can stop an individual RegionServer by running the following - script in the HBase directory on the particular node: - $ ./bin/hbase-daemon.sh stop regionserver - The RegionServer will first close all regions and then shut itself down. - On shutdown, the RegionServer's ephemeral node in ZooKeeper will expire. - The master will notice the RegionServer gone and will treat it as - a 'crashed' server; it will reassign the nodes the RegionServer was carrying. - Disable the Load Balancer before Decommissioning a node - If the load balancer runs while a node is shutting down, then - there could be contention between the Load Balancer and the - Master's recovery of the just decommissioned RegionServer. - Avoid any problems by disabling the balancer first. - See below. - - - - - A downside to the above stop of a RegionServer is that regions could be offline for - a good period of time. Regions are closed in order. If many regions on the server, the - first region to close may not be back online until all regions close and after the master - notices the RegionServer's znode gone. In Apache HBase 0.90.2, we added facility for having - a node gradually shed its load and then shutdown itself down. Apache HBase 0.90.2 added the - graceful_stop.sh script. Here is its usage: - $ ./bin/graceful_stop.sh +
+ Node Management +
+ Node Decommission + You can stop an individual RegionServer by running the following script in the HBase + directory on the particular node: + $ ./bin/hbase-daemon.sh stop regionserver + The RegionServer will first close all regions and then shut itself down. On shutdown, + the RegionServer's ephemeral node in ZooKeeper will expire. The master will notice the + RegionServer gone and will treat it as a 'crashed' server; it will reassign the nodes the + RegionServer was carrying. + + Disable the Load Balancer before Decommissioning a node + If the load balancer runs while a node is shutting down, then there could be + contention between the Load Balancer and the Master's recovery of the just decommissioned + RegionServer. Avoid any problems by disabling the balancer first. See + below. + + A downside to the above stop of a RegionServer is that regions could be offline for a + good period of time. Regions are closed in order. If many regions on the server, the first + region to close may not be back online until all regions close and after the master notices + the RegionServer's znode gone. In Apache HBase 0.90.2, we added facility for having a node + gradually shed its load and then shutdown itself down. Apache HBase 0.90.2 added the + graceful_stop.sh script. Here is its usage: + $ ./bin/graceful_stop.sh Usage: graceful_stop.sh [--config &conf-dir>] [--restart] [--reload] [--thrift] [--rest] &hostname> thrift If we should stop/start thrift before/after the hbase stop/start rest If we should stop/start rest before/after the hbase stop/start @@ -516,372 +559,430 @@ Usage: graceful_stop.sh [--config &conf-dir>] [--restart] [--reload] [--thri reload Move offloaded regions back on to the stopped server debug Move offloaded regions back on to the stopped server hostname Hostname of server we are to stop + To decommission a loaded RegionServer, run the following: $ + ./bin/graceful_stop.sh HOSTNAME where HOSTNAME is the host + carrying the RegionServer you would decommission. + + On <varname>HOSTNAME</varname> + The HOSTNAME passed to graceful_stop.sh must + match the hostname that hbase is using to identify RegionServers. Check the list of + RegionServers in the master UI for how HBase is referring to servers. Its usually hostname + but can also be FQDN. Whatever HBase is using, this is what you should pass the + graceful_stop.sh decommission script. If you pass IPs, the script + is not yet smart enough to make a hostname (or FQDN) of it and so it will fail when it + checks if server is currently running; the graceful unloading of regions will not run. - - To decommission a loaded RegionServer, run the following: - $ ./bin/graceful_stop.sh HOSTNAME - where HOSTNAME is the host carrying the RegionServer - you would decommission. - On <varname>HOSTNAME</varname> - The HOSTNAME passed to graceful_stop.sh - must match the hostname that hbase is using to identify RegionServers. - Check the list of RegionServers in the master UI for how HBase is - referring to servers. Its usually hostname but can also be FQDN. - Whatever HBase is using, this is what you should pass the - graceful_stop.sh decommission - script. If you pass IPs, the script is not yet smart enough to make - a hostname (or FQDN) of it and so it will fail when it checks if server is - currently running; the graceful unloading of regions will not run. - - The graceful_stop.sh script will move the regions off the - decommissioned RegionServer one at a time to minimize region churn. 
- It will verify the region deployed in the new location before it - will moves the next region and so on until the decommissioned server - is carrying zero regions. At this point, the graceful_stop.sh - tells the RegionServer stop. The master will at this point notice the - RegionServer gone but all regions will have already been redeployed - and because the RegionServer went down cleanly, there will be no - WAL logs to split. - Load Balancer - - It is assumed that the Region Load Balancer is disabled while the - graceful_stop script runs (otherwise the balancer - and the decommission script will end up fighting over region deployments). - Use the shell to disable the balancer: - hbase(main):001:0> balance_switch false + + The graceful_stop.sh script will move the regions off the + decommissioned RegionServer one at a time to minimize region churn. It will verify the + region deployed in the new location before it will moves the next region and so on until the + decommissioned server is carrying zero regions. At this point, the + graceful_stop.sh tells the RegionServer stop. The + master will at this point notice the RegionServer gone but all regions will have already + been redeployed and because the RegionServer went down cleanly, there will be no WAL logs to + split. + + Load Balancer + It is assumed that the Region Load Balancer is disabled while the + graceful_stop script runs (otherwise the balancer and the + decommission script will end up fighting over region deployments). Use the shell to + disable the balancer: + hbase(main):001:0> balance_switch false true 0 row(s) in 0.3590 seconds -This turns the balancer OFF. To reenable, do: - hbase(main):001:0> balance_switch true + This turns the balancer OFF. To reenable, do: + hbase(main):001:0> balance_switch true false 0 row(s) in 0.3590 seconds - - The graceful_stop will check the balancer - and if enabled, will turn it off before it goes to work. If it - exits prematurely because of error, it will not have reset the - balancer. Hence, it is better to manage the balancer apart from - graceful_stop reenabling it after you are done - w/ graceful_stop. - - + The graceful_stop will check the balancer and if enabled, will turn + it off before it goes to work. If it exits prematurely because of error, it will not have + reset the balancer. Hence, it is better to manage the balancer apart from + graceful_stop reenabling it after you are done w/ graceful_stop. -
- Decommissioning several Regions Servers concurrently - If you have a large cluster, you may want to - decommission more than one machine at a time by gracefully - stopping mutiple RegionServers concurrently. - To gracefully drain multiple regionservers at the - same time, RegionServers can be put into a "draining" - state. This is done by marking a RegionServer as a - draining node by creating an entry in ZooKeeper under the - hbase_root/draining znode. This znode has format - name,port,startcode just like the regionserver entries - under hbase_root/rs znode. - - Without this facility, decommissioning mulitple nodes - may be non-optimal because regions that are being drained - from one region server may be moved to other regionservers that - are also draining. Marking RegionServers to be in the - draining state prevents this from happeningSee - this blog - post for more details.. - -
+ +
+ Decommissioning several RegionServers concurrently
+ If you have a large cluster, you may want to decommission more than one machine at a
+ time by gracefully stopping multiple RegionServers concurrently. To gracefully drain
+ multiple regionservers at the same time, RegionServers can be put into a "draining" state.
+ This is done by marking a RegionServer as a draining node by creating an entry in
+ ZooKeeper under the hbase_root/draining znode. This znode has format
+ name,port,startcode just like the regionserver entries under the
+ hbase_root/rs znode.
+ Without this facility, decommissioning multiple nodes may be non-optimal because
+ regions that are being drained from one region server may be moved to other regionservers
+ that are also draining. Marking RegionServers to be in the draining state prevents this
+ from happening
+ See this blog post for more details.
+ .
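+ A minimal sketch of marking a server as draining with the ZooKeeper shell that ships with
+ HBase, assuming the default znode parent of /hbase; the hostname, port and startcode below
+ are hypothetical and must match that server's entry under /hbase/rs:
+ $ ./bin/hbase zkcli
+ [zk: localhost:2181(CONNECTED) 0] create /hbase/draining/myregionserver.example.com,60020,1325335015803 ""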
-
- Bad or Failing Disk - It is good having set if you have a decent number of disks - per machine for the case where a disk plain dies. But usually disks do the "John Wayne" -- i.e. take a while - to go down spewing errors in dmesg -- or for some reason, run much slower than their - companions. In this case you want to decommission the disk. You have two options. You can - decommission the datanode - or, less disruptive in that only the bad disks data will be rereplicated, can stop the datanode, - unmount the bad volume (You can't umount a volume while the datanode is using it), and then restart the - datanode (presuming you have set dfs.datanode.failed.volumes.tolerated > 0). The regionserver will - throw some errors in its logs as it recalibrates where to get its data from -- it will likely - roll its WAL log too -- but in general but for some latency spikes, it should keep on chugging. - - Short Circuit Reads - If you are doing short-circuit reads, you will have to move the regions off the regionserver - before you stop the datanode; when short-circuiting reading, though chmod'd so regionserver cannot - have access, because it already has the files open, it will be able to keep reading the file blocks - from the bad disk even though the datanode is down. Move the regions back after you restart the - datanode. - - -
-
-
- Rolling Restart - - You can also ask this script to restart a RegionServer after the shutdown - AND move its old regions back into place. The latter you might do to - retain data locality. A primitive rolling restart might be effected by - running something like the following: - $ for i in `cat conf/regionservers|sort`; do ./bin/graceful_stop.sh --restart --reload --debug $i; done &> /tmp/log.txt & +
+ Bad or Failing Disk
+ It is good having set if you
+ have a decent number of disks per machine for the case where a disk plain dies. But
+ usually disks do the "John Wayne" -- i.e. take a while to go down spewing errors in
+ dmesg -- or for some reason, run much slower than their companions.
+ In this case you want to decommission the disk. You have two options. You can
+ decommission the datanode or, less disruptive in that only the bad disk's data
+ will be rereplicated, you can stop the datanode, unmount the bad volume (you can't umount a
+ volume while the datanode is using it), and then restart the datanode (presuming you have
+ set dfs.datanode.failed.volumes.tolerated > 0). The regionserver will throw some errors in
+ its logs as it recalibrates where to get its data from -- it will likely roll its WAL log
+ too -- but in general, aside from some latency spikes, it should keep on chugging.
+ 
+ Short Circuit Reads
+ If you are doing short-circuit reads, you will have to move the regions off the
+ regionserver before you stop the datanode; when short-circuiting reading, though chmod'd
+ so the regionserver cannot have access, because it already has the files open, it will be
+ able to keep reading the file blocks from the bad disk even though the datanode is down.
+ Move the regions back after you restart the datanode.
+ 
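+ A sketch of the HDFS setting referenced above, placed in hdfs-site.xml on the DataNodes;
+ the value of 1 is only an example and means the DataNode keeps running after a single
+ volume failure:
+ <property>
+   <name>dfs.datanode.failed.volumes.tolerated</name>
+   <value>1</value>
+ </property>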
+
+
+ Rolling Restart + You can also ask this script to restart a RegionServer after the shutdown AND move its + old regions back into place. The latter you might do to retain data locality. A primitive + rolling restart might be effected by running something like the following: + $ for i in `cat conf/regionservers|sort`; do ./bin/graceful_stop.sh --restart --reload --debug $i; done &> /tmp/log.txt & + + Tail the output of /tmp/log.txt to follow the scripts progress. + The above does RegionServers only. The script will also disable the load balancer before + moving the regions. You'd need to do the master update separately. Do it before you run the + above script. Here is a pseudo-script for how you might craft a rolling restart script: + + + Untar your release, make sure of its configuration and then rsync it across the + cluster. If this is 0.90.2, patch it with HBASE-3744 and HBASE-3756. + + + Run hbck to ensure the cluster consistent + $ ./bin/hbase hbck Effect repairs if inconsistent. + + + + Restart the Master: + $ ./bin/hbase-daemon.sh stop master; ./bin/hbase-daemon.sh start master + + + + Run the graceful_stop.sh script per RegionServer. For + example: + $ for i in `cat conf/regionservers|sort`; do ./bin/graceful_stop.sh --restart --reload --debug $i; done &> /tmp/log.txt & - Tail the output of /tmp/log.txt to follow the scripts - progress. The above does RegionServers only. The script will also disable the - load balancer before moving the regions. You'd need to do the master - update separately. Do it before you run the above script. - Here is a pseudo-script for how you might craft a rolling restart script: - - Untar your release, make sure of its configuration and - then rsync it across the cluster. If this is 0.90.2, patch it - with HBASE-3744 and HBASE-3756. - - - - Run hbck to ensure the cluster consistent - $ ./bin/hbase hbck - Effect repairs if inconsistent. - - - - Restart the Master: $ ./bin/hbase-daemon.sh stop master; ./bin/hbase-daemon.sh start master - - - - Run the graceful_stop.sh script per RegionServer. For example: - $ for i in `cat conf/regionservers|sort`; do ./bin/graceful_stop.sh --restart --reload --debug $i; done &> /tmp/log.txt & - - If you are running thrift or rest servers on the RegionServer, pass --thrift or --rest options (See usage - for graceful_stop.sh script). - - - - Restart the Master again. This will clear out dead servers list and reenable the balancer. - - - - Run hbck to ensure the cluster is consistent. - - - - - It is important to drain HBase regions slowly when - restarting regionservers. Otherwise, multiple regions go - offline simultaneously as they are re-assigned to other - nodes. Depending on your usage patterns, this might not be - desirable. - + If you are running thrift or rest servers on the RegionServer, pass --thrift or + --rest options (See usage for graceful_stop.sh script). + + + Restart the Master again. This will clear out dead servers list and reenable the + balancer. + + + Run hbck to ensure the cluster is consistent. + + + It is important to drain HBase regions slowly when restarting regionservers. Otherwise, + multiple regions go offline simultaneously as they are re-assigned to other nodes. Depending + on your usage patterns, this might not be desirable.
- Adding a New Node - Adding a new regionserver in HBase is essentially free, you simply start it like this: - $ ./bin/hbase-daemon.sh start regionserver - and it will register itself with the master. Ideally you also started a DataNode on the same - machine so that the RS can eventually start to have local files. If you rely on ssh to start your - daemons, don't forget to add the new hostname in conf/regionservers on the master. - - At this point the region server isn't serving data because no regions have moved to it yet. If the balancer is - enabled, it will start moving regions to the new RS. On a small/medium cluster this can have a very adverse effect - on latency as a lot of regions will be offline at the same time. It is thus recommended to disable the balancer - the same way it's done when decommissioning a node and move the regions manually (or even better, using a script - that moves them one by one). - - The moved regions will all have 0% locality and won't have any blocks in cache so the region server will have - to use the network to serve requests. Apart from resulting in higher latency, it may also be able to use all of - your network card's capacity. For practical purposes, consider that a standard 1GigE NIC won't be able to read - much more than 100MB/s. In this case, or if you are in a OLAP environment and require having - locality, then it is recommended to major compact the moved regions. - + Adding a New Node + Adding a new regionserver in HBase is essentially free, you simply start it like this: + $ ./bin/hbase-daemon.sh start regionserver and it will register itself + with the master. Ideally you also started a DataNode on the same machine so that the RS can + eventually start to have local files. If you rely on ssh to start your daemons, don't forget + to add the new hostname in conf/regionservers on the master. + At this point the region server isn't serving data because no regions have moved to it + yet. If the balancer is enabled, it will start moving regions to the new RS. On a + small/medium cluster this can have a very adverse effect on latency as a lot of regions will + be offline at the same time. It is thus recommended to disable the balancer the same way + it's done when decommissioning a node and move the regions manually (or even better, using a + script that moves them one by one). + The moved regions will all have 0% locality and won't have any blocks in cache so the + region server will have to use the network to serve requests. Apart from resulting in higher + latency, it may also be able to use all of your network card's capacity. For practical + purposes, consider that a standard 1GigE NIC won't be able to read much more than + 100MB/s. In this case, or if you are in a OLAP environment and + require having locality, then it is recommended to major compact the moved regions.
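+ One way to move regions by hand, as suggested above, is the shell's move command. A sketch
+ with hypothetical identifiers -- the encoded region name, and the target server name exactly
+ as it is listed in the master UI:
+ $ ./bin/hbase shell
+ hbase> move 'b713fd655c8ef9f51d53eea44c7ee884', 'newnode.example.com,60020,1342956111995'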
-
+
+
- HBase Metrics -
- Metric Setup - See Metrics for - an introduction and how to enable Metrics emission. Still valid for HBase 0.94.x. - - For HBase 0.95.x and up, see - -
-
- Warning To Ganglia Users - Warning to Ganglia Users: by default, HBase will emit a LOT of metrics per RegionServer which may swamp your installation. - Options include either increasing Ganglia server capacity, or configuring HBase to emit fewer metrics. - -
-
- Most Important RegionServer Metrics -
<varname>blockCacheExpressCachingRatio (formerly blockCacheHitCachingRatio)</varname> - Block cache hit caching ratio (0 to 100). The cache-hit ratio for reads configured to look in the cache (i.e., cacheBlocks=true). -
-
<varname>callQueueLength</varname> - Point in time length of the RegionServer call queue. If requests arrive faster than the RegionServer handlers can process - them they will back up in the callQueue. -
-
<varname>compactionQueueLength (formerly compactionQueueSize)</varname> - Point in time length of the compaction queue. This is the number of Stores in the RegionServer that have been targeted for compaction. -
-
<varname>flushQueueSize</varname> - Point in time number of enqueued regions in the MemStore awaiting flush. -
-
<varname>hdfsBlocksLocalityIndex</varname> - Point in time percentage of HDFS blocks that are local to this RegionServer. The higher the better. -
-
<varname>memstoreSizeMB</varname> - Point in time sum of all the memstore sizes in this RegionServer (MB). Watch for this nearing or exceeding - the configured high-watermark for MemStore memory in the RegionServer. -
-
<varname>numberOfOnlineRegions</varname> - Point in time number of regions served by the RegionServer. This is an important metric to track for RegionServer-Region density. - -
-
<varname>readRequestsCount</varname> - Number of read requests for this RegionServer since startup. Note: this is a 32-bit integer and can roll. -
-
<varname>slowHLogAppendCount</varname> - Number of slow HLog append writes for this RegionServer since startup, where "slow" is > 1 second. This is - a good "canary" metric for HDFS. -
-
<varname>usedHeapMB</varname> - Point in time amount of memory used by the RegionServer (MB). -
-
<varname>writeRequestsCount</varname> - Number of write requests for this RegionServer since startup. Note: this is a 32-bit integer and can roll. -
+ HBase Metrics +
+ Metric Setup + See Metrics for an + introduction and how to enable Metrics emission. Still valid for HBase 0.94.x. + For HBase 0.95.x and up, see + +
+
+ Warning To Ganglia Users + Warning to Ganglia Users: by default, HBase will emit a LOT of metrics per RegionServer + which may swamp your installation. Options include either increasing Ganglia server + capacity, or configuring HBase to emit fewer metrics. +
+
+ Most Important RegionServer Metrics +
+ <varname>blockCacheExpressCachingRatio (formerly + blockCacheHitCachingRatio)</varname> + Block cache hit caching ratio (0 to 100). The cache-hit ratio for reads configured to + look in the cache (i.e., cacheBlocks=true). +
+
+ <varname>callQueueLength</varname> + Point in time length of the RegionServer call queue. If requests arrive faster than + the RegionServer handlers can process them they will back up in the callQueue. +
+
+ <varname>compactionQueueLength (formerly compactionQueueSize)</varname> + Point in time length of the compaction queue. This is the number of Stores in the + RegionServer that have been targeted for compaction. +
+
+ <varname>flushQueueSize</varname> + Point in time number of enqueued regions in the MemStore awaiting flush. +
+
+ <varname>hdfsBlocksLocalityIndex</varname> + Point in time percentage of HDFS blocks that are local to this RegionServer. The + higher the better. +
+
+ <varname>memstoreSizeMB</varname> + Point in time sum of all the memstore sizes in this RegionServer (MB). Watch for this + nearing or exceeding the configured high-watermark for MemStore memory in the + RegionServer. +
+
+ <varname>numberOfOnlineRegions</varname> + Point in time number of regions served by the RegionServer. This is an important + metric to track for RegionServer-Region density. +
+
+ <varname>readRequestsCount</varname> + Number of read requests for this RegionServer since startup. Note: this is a 32-bit + integer and can roll. +
+
+ <varname>slowHLogAppendCount</varname> + Number of slow HLog append writes for this RegionServer since startup, where "slow" is + > 1 second. This is a good "canary" metric for HDFS. +
+
+ <varname>usedHeapMB</varname> + Point in time amount of memory used by the RegionServer (MB). +
+
+ <varname>writeRequestsCount</varname> + Number of write requests for this RegionServer since startup. Note: this is a 32-bit + integer and can roll. +
-
-
- Other RegionServer Metrics -
<varname>blockCacheCount</varname> - Point in time block cache item count in memory. This is the number of blocks of StoreFiles (HFiles) in the cache. -
-
<varname>blockCacheEvictedCount</varname> - Number of blocks that had to be evicted from the block cache due to heap size constraints by RegionServer since startup. -
-
<varname>blockCacheFreeMB</varname> - Point in time block cache memory available (MB). -
-
<varname>blockCacheHitCount</varname> - Number of blocks of StoreFiles (HFiles) read from the cache by RegionServer since startup. -
-
<varname>blockCacheHitRatio</varname> - Block cache hit ratio (0 to 100) from RegionServer startup. Includes all read requests, although those with cacheBlocks=false - will always read from disk and be counted as a "cache miss", which means that full-scan MapReduce jobs can affect - this metric significantly. -
-
<varname>blockCacheMissCount</varname> - Number of blocks of StoreFiles (HFiles) requested but not read from the cache from RegionServer startup. -
-
<varname>blockCacheSizeMB</varname> - Point in time block cache size in memory (MB). i.e., memory in use by the BlockCache -
-
<varname>fsPreadLatency*</varname> - There are several filesystem positional read latency (ms) metrics, all measured from RegionServer startup. -
-
<varname>fsReadLatency*</varname> - There are several filesystem read latency (ms) metrics, all measured from RegionServer startup. The issue with - interpretation is that ALL reads go into this metric (e.g., single-record Gets, full table Scans), including - reads required for compactions. This metric is only interesting "over time" when comparing - major releases of HBase or your own code. -
-
<varname>fsWriteLatency*</varname> - There are several filesystem write latency (ms) metrics, all measured from RegionServer startup. The issue with - interpretation is that ALL writes go into this metric (e.g., single-record Puts, full table re-writes due to compaction). - This metric is only interesting "over time" when comparing - major releases of HBase or your own code. -
-
<varname>NumberOfStores</varname> - Point in time number of Stores open on the RegionServer. A Store corresponds to a ColumnFamily. For example, - if a table (which contains the column family) has 3 regions on a RegionServer, there will be 3 stores open for that - column family. -
-
<varname>NumberOfStorefiles</varname> - Point in time number of StoreFiles open on the RegionServer. A store may have more than one StoreFile (HFile). -
-
<varname>requestsPerSecond</varname> - Point in time number of read and write requests. Requests correspond to RegionServer RPC calls, - thus a single Get will result in 1 request, but a Scan with caching set to 1000 will result in 1 request for each 'next' call - (i.e., not each row). A bulk-load request will constitute 1 request per HFile. - This metric is less interesting than readRequestsCount and writeRequestsCount in terms of measuring activity - due to this metric being periodic. -
-
<varname>storeFileIndexSizeMB</varname> - Point in time sum of all the StoreFile index sizes in this RegionServer (MB) -
-
+
+
+ Other RegionServer Metrics +
+ <varname>blockCacheCount</varname> + Point in time block cache item count in memory. This is the number of blocks of + StoreFiles (HFiles) in the cache. +
+
+ <varname>blockCacheEvictedCount</varname> + Number of blocks that had to be evicted from the block cache due to heap size + constraints by RegionServer since startup. +
+
+ <varname>blockCacheFreeMB</varname> + Point in time block cache memory available (MB). +
+
+ <varname>blockCacheHitCount</varname> + Number of blocks of StoreFiles (HFiles) read from the cache by RegionServer since + startup. +
+
+ <varname>blockCacheHitRatio</varname> + Block cache hit ratio (0 to 100) from RegionServer startup. Includes all read + requests, although those with cacheBlocks=false will always read from disk and be counted + as a "cache miss", which means that full-scan MapReduce jobs can affect this metric + significantly. +
+
+ <varname>blockCacheMissCount</varname> + Number of blocks of StoreFiles (HFiles) requested but not read from the cache from + RegionServer startup. +
+
+ <varname>blockCacheSizeMB</varname> + Point in time block cache size in memory (MB). i.e., memory in use by the + BlockCache +
+
+ <varname>fsPreadLatency*</varname> + There are several filesystem positional read latency (ms) metrics, all measured from + RegionServer startup. +
+
+ <varname>fsReadLatency*</varname> + There are several filesystem read latency (ms) metrics, all measured from RegionServer + startup. The issue with interpretation is that ALL reads go into this metric (e.g., + single-record Gets, full table Scans), including reads required for compactions. This + metric is only interesting "over time" when comparing major releases of HBase or your own + code. +
+
+ <varname>fsWriteLatency*</varname> + There are several filesystem write latency (ms) metrics, all measured from + RegionServer startup. The issue with interpretation is that ALL writes go into this metric + (e.g., single-record Puts, full table re-writes due to compaction). This metric is only + interesting "over time" when comparing major releases of HBase or your own code. +
+
+ <varname>NumberOfStores</varname> + Point in time number of Stores open on the RegionServer. A Store corresponds to a + ColumnFamily. For example, if a table (which contains the column family) has 3 regions on + a RegionServer, there will be 3 stores open for that column family. +
+
+ <varname>NumberOfStorefiles</varname> + Point in time number of StoreFiles open on the RegionServer. A store may have more + than one StoreFile (HFile). +
+
+ <varname>requestsPerSecond</varname> + Point in time number of read and write requests. Requests correspond to RegionServer + RPC calls, thus a single Get will result in 1 request, but a Scan with caching set to 1000 + will result in 1 request for each 'next' call (i.e., not each row). A bulk-load request + will constitute 1 request per HFile. This metric is less interesting than + readRequestsCount and writeRequestsCount in terms of measuring activity due to this metric + being periodic. +
+
+ <varname>storeFileIndexSizeMB</varname> + Point in time sum of all the StoreFile index sizes in this RegionServer (MB) +
+
- HBase Monitoring + HBase Monitoring
- Overview - The following metrics are arguably the most important to monitor for each RegionServer for - "macro monitoring", preferably with a system like OpenTSDB. - If your cluster is having performance issues it's likely that you'll see something unusual with - this group. - - HBase: + Overview + The following metrics are arguably the most important to monitor for each RegionServer + for "macro monitoring", preferably with a system like OpenTSDB. If your cluster is having performance + issues it's likely that you'll see something unusual with this group. - See + HBase: + + See + - - OS: + - IO Wait - User CPU + OS: + + IO Wait + + + User CPU + - - Java: - GC + Java: + + GC + - - - - - For more information on HBase metrics, see . - + For more information on HBase metrics, see .
- Slow Query Log -The HBase slow query log consists of parseable JSON structures describing the properties of those client operations (Gets, Puts, Deletes, etc.) that either took too long to run, or produced too much output. The thresholds for "too long to run" and "too much output" are configurable, as described below. The output is produced inline in the main region server logs so that it is easy to discover further details from context with other logged events. It is also prepended with identifying tags (responseTooSlow), (responseTooLarge), (operationTooSlow), and (operationTooLarge) in order to enable easy filtering with grep, in case the user desires to see only slow queries. - + Slow Query Log + The HBase slow query log consists of parseable JSON structures describing the properties + of those client operations (Gets, Puts, Deletes, etc.) that either took too long to run, or + produced too much output. The thresholds for "too long to run" and "too much output" are + configurable, as described below. The output is produced inline in the main region server + logs so that it is easy to discover further details from context with other logged events. + It is also prepended with identifying tags (responseTooSlow), + (responseTooLarge), (operationTooSlow), and + (operationTooLarge) in order to enable easy filtering with grep, in + case the user desires to see only slow queries. -
Configuration -There are two configuration knobs that can be used to adjust the thresholds for when queries are logged. - +
+ Configuration + There are two configuration knobs that can be used to adjust the thresholds for when + queries are logged. - - -hbase.ipc.warn.response.time Maximum number of milliseconds that a query can be run without being logged. Defaults to 10000, or 10 seconds. Can be set to -1 to disable logging by time. - -hbase.ipc.warn.response.size Maximum byte size of response that a query can return without being logged. Defaults to 100 megabytes. Can be set to -1 to disable logging by size. - - -
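+ A sketch of how these two properties might be set in hbase-site.xml; the values shown
+ simply restate the documented defaults (10 seconds, and 100 megabytes expressed in bytes):
+ <property>
+   <name>hbase.ipc.warn.response.time</name>
+   <value>10000</value>
+ </property>
+ <property>
+   <name>hbase.ipc.warn.response.size</name>
+   <value>104857600</value>
+ </property>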
+ + + hbase.ipc.warn.response.time Maximum number of milliseconds + that a query can be run without being logged. Defaults to 10000, or 10 seconds. Can be + set to -1 to disable logging by time. + + + hbase.ipc.warn.response.size Maximum byte size of response that + a query can return without being logged. Defaults to 100 megabytes. Can be set to -1 + to disable logging by size. + + +
-
Metrics -The slow query log exposes to metrics to JMX. -hadoop.regionserver_rpc_slowResponse a global metric reflecting the durations of all responses that triggered logging. -hadoop.regionserver_rpc_methodName.aboveOneSec A metric reflecting the durations of all responses that lasted for more than one second. - - -
+
+ Metrics
+ The slow query log exposes two metrics to JMX.
+ 
+ hadoop.regionserver_rpc_slowResponse a global metric reflecting
+ the durations of all responses that triggered logging.
+ 
+ hadoop.regionserver_rpc_methodName.aboveOneSec A metric
+ reflecting the durations of all responses that lasted for more than one second.
+ 
Output -The output is tagged with operation e.g. (operationTooSlow) if the call was a client operation, such as a Put, Get, or Delete, which we expose detailed fingerprint information for. If not, it is tagged (responseTooSlow) and still produces parseable JSON output, but with less verbose information solely regarding its duration and size in the RPC itself. TooLarge is substituted for TooSlow if the response size triggered the logging, with TooLarge appearing even in the case that both size and duration triggered logging. - -
-
Example - -2011-09-08 10:01:25,824 WARN org.apache.hadoop.ipc.HBaseServer: (operationTooSlow): {"tables":{"riley2":{"puts":[{"totalColumns":11,"families":{"actions":[{"timestamp":1315501284459,"qualifier":"0","vlen":9667580},{"timestamp":1315501284459,"qualifier":"1","vlen":10122412},{"timestamp":1315501284459,"qualifier":"2","vlen":11104617},{"timestamp":1315501284459,"qualifier":"3","vlen":13430635}]},"row":"cfcd208495d565ef66e7dff9f98764da:0"}],"families":["actions"]}},"processingtimems":956,"client":"10.47.34.63:33623","starttimems":1315501284456,"queuetimems":0,"totalPuts":1,"class":"HRegionServer","responsesize":0,"method":"multiPut"} - +
-Note that everything inside the "tables" structure is output produced by MultiPut's fingerprint, while the rest of the information is RPC-specific, such as processing time and client IP/port. Other client operations follow the same pattern and the same general structure, with necessary differences due to the nature of the individual operations. In the case that the call is not a client operation, that detailed fingerprint information will be completely absent. - +
+ Output + The output is tagged with operation e.g. (operationTooSlow) if + the call was a client operation, such as a Put, Get, or Delete, which we expose detailed + fingerprint information for. If not, it is tagged (responseTooSlow) + and still produces parseable JSON output, but with less verbose information solely + regarding its duration and size in the RPC itself. TooLarge is + substituted for TooSlow if the response size triggered the logging, + with TooLarge appearing even in the case that both size and duration + triggered logging. +
+
+ Example + + 2011-09-08 10:01:25,824 WARN org.apache.hadoop.ipc.HBaseServer: (operationTooSlow): {"tables":{"riley2":{"puts":[{"totalColumns":11,"families":{"actions":[{"timestamp":1315501284459,"qualifier":"0","vlen":9667580},{"timestamp":1315501284459,"qualifier":"1","vlen":10122412},{"timestamp":1315501284459,"qualifier":"2","vlen":11104617},{"timestamp":1315501284459,"qualifier":"3","vlen":13430635}]},"row":"cfcd208495d565ef66e7dff9f98764da:0"}],"families":["actions"]}},"processingtimems":956,"client":"10.47.34.63:33623","starttimems":1315501284456,"queuetimems":0,"totalPuts":1,"class":"HRegionServer","responsesize":0,"method":"multiPut"} + -This particular example, for example, would indicate that the likely cause of slowness is simply a very large (on the order of 100MB) multiput, as we can tell by the "vlen," or value length, fields of each put in the multiPut. - -
-
+ Note that everything inside the "tables" structure is output produced by MultiPut's + fingerprint, while the rest of the information is RPC-specific, such as processing time + and client IP/port. Other client operations follow the same pattern and the same general + structure, with necessary differences due to the nature of the individual operations. In + the case that the call is not a client operation, that detailed fingerprint information + will be completely absent. + + This particular example, for example, would indicate that the likely cause of slowness + is simply a very large (on the order of 100MB) multiput, as we can tell by the "vlen," or + value length, fields of each put in the multiPut. +
+
@@ -889,252 +990,399 @@ false
Cluster Replication - See Cluster Replication. - + See Cluster + Replication.
- HBase Backup - There are two broad strategies for performing HBase backups: backing up with a full cluster shutdown, and backing up on a live cluster. - Each approach has pros and cons. - - For additional information, see HBase Backup Options over on the Sematext Blog. - -
Full Shutdown Backup - Some environments can tolerate a periodic full shutdown of their HBase cluster, for example if it is being used a back-end analytic capacity - and not serving front-end web-pages. The benefits are that the NameNode/Master are RegionServers are down, so there is no chance of missing - any in-flight changes to either StoreFiles or metadata. The obvious con is that the cluster is down. The steps include: - -
Stop HBase - - + HBase Backup + There are two broad strategies for performing HBase backups: backing up with a full + cluster shutdown, and backing up on a live cluster. Each approach has pros and cons. + For additional information, see HBase Backup + Options over on the Sematext Blog. +
+ Full Shutdown Backup
+ Some environments can tolerate a periodic full shutdown of their HBase cluster, for
+ example if it is being used as a back-end analytic capacity and not serving front-end
+ web-pages. The benefit is that the NameNode/Master and RegionServers are down, so there is
+ no chance of missing any in-flight changes to either StoreFiles or metadata. The obvious con
+ is that the cluster is down. The steps include:
+ Stop HBase +
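+ For example, from the node running the Master:
+ $ ./bin/stop-hbase.sh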
-
Distcp - Distcp could be used to either copy the contents of the HBase directory in HDFS to either the same cluster in another directory, or - to a different cluster. - - Note: Distcp works in this situation because the cluster is down and there are no in-flight edits to files. - Distcp-ing of files in the HBase directory is not generally recommended on a live cluster. - +
+ Distcp + Distcp could be used to either copy the contents of the HBase directory in HDFS to + either the same cluster in another directory, or to a different cluster. + Note: Distcp works in this situation because the cluster is down and there are no + in-flight edits to files. Distcp-ing of files in the HBase directory is not generally + recommended on a live cluster.
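+ A sketch of both variants; all paths and NameNode addresses are hypothetical:
+ # copy within the same cluster to a dated backup directory
+ $ hadoop distcp /hbase /hbase-backup-20140101
+ 
+ # copy to a different cluster
+ $ hadoop distcp hdfs://prodnn:8020/hbase hdfs://backupnn:8020/hbase-backup-20140101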
-
Restore (if needed) - The backup of the hbase directory from HDFS is copied onto the 'real' hbase directory via distcp. The act of copying these files - creates new HDFS metadata, which is why a restore of the NameNode edits from the time of the HBase backup isn't required for this kind of - restore, because it's a restore (via distcp) of a specific HDFS directory (i.e., the HBase part) not the entire HDFS file-system. - +
+ Restore (if needed) + The backup of the hbase directory from HDFS is copied onto the 'real' hbase directory + via distcp. The act of copying these files creates new HDFS metadata, which is why a + restore of the NameNode edits from the time of the HBase backup isn't required for this + kind of restore, because it's a restore (via distcp) of a specific HDFS directory (i.e., + the HBase part) not the entire HDFS file-system.
-
Live Cluster Backup - Replication - This approach assumes that there is a second cluster. - See the HBase page on replication for more information. - +
+ Live Cluster Backup - Replication + This approach assumes that there is a second cluster. See the HBase page on replication for more + information.
-
Live Cluster Backup - CopyTable - The utility could either be used to copy data from one table to another on the - same cluster, or to copy data to another table on another cluster. - +
+ Live Cluster Backup - CopyTable + The utility could either be used to copy data from one table + to another on the same cluster, or to copy data to another table on another cluster. Since the cluster is up, there is a risk that edits could be missed in the copy process.
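+ A sketch of both uses; the table names and the peer address are hypothetical, and running
+ the tool with no arguments prints its full usage output:
+ # copy to another table on the same cluster
+ $ ./bin/hbase org.apache.hadoop.hbase.mapreduce.CopyTable --new.name=myTableBackup myTable
+ 
+ # copy to a table of the same name on another cluster
+ $ ./bin/hbase org.apache.hadoop.hbase.mapreduce.CopyTable --peer.adr=backupcluster-zk1:2181:/hbase myTable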
-
Live Cluster Backup - Export - The approach dumps the content of a table to HDFS on the same cluster. To restore the data, the - utility would be used. - - Since the cluster is up, there is a risk that edits could be missed in the export process. - +
+ Live Cluster Backup - Export + The approach dumps the content of a table to HDFS on the same + cluster. To restore the data, the utility would be used. + Since the cluster is up, there is a risk that edits could be missed in the export + process.
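+ A sketch of a dump and a later restore; the table name and output directory are
+ hypothetical, and the target table must already exist before running Import:
+ # dump the table to HDFS
+ $ ./bin/hbase org.apache.hadoop.hbase.mapreduce.Export myTable /backups/myTable
+ 
+ # restore the dump into a table with the same schema
+ $ ./bin/hbase org.apache.hadoop.hbase.mapreduce.Import myTable /backups/myTable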
-
+
+
HBase Snapshots - HBase Snapshots allow you to take a snapshot of a table without too much impact on Region Servers. - Snapshot, Clone and restore operations don't involve data copying. - Also, Exporting the snapshot to another cluster doesn't have impact on the Region Servers. - - Prior to version 0.94.6, the only way to backup or to clone a table is to use CopyTable/ExportTable, - or to copy all the hfiles in HDFS after disabling the table. - The disadvantages of these methods are that you can degrade region server performance - (Copy/Export Table) or you need to disable the table, that means no reads or writes; - and this is usually unacceptable. - -
Configuration - To turn on the snapshot support just set the - hbase.snapshot.enabled property to true. - (Snapshots are enabled by default in 0.95+ and off by default in 0.94.6+) - + HBase Snapshots allow you to take a snapshot of a table without too much impact on Region + Servers. Snapshot, Clone and restore operations don't involve data copying. Also, Exporting + the snapshot to another cluster doesn't have impact on the Region Servers. + Prior to version 0.94.6, the only way to backup or to clone a table is to use + CopyTable/ExportTable, or to copy all the hfiles in HDFS after disabling the table. The + disadvantages of these methods are that you can degrade region server performance (Copy/Export + Table) or you need to disable the table, that means no reads or writes; and this is usually + unacceptable. +
+ Configuration + To turn on the snapshot support just set the hbase.snapshot.enabled + property to true. (Snapshots are enabled by default in 0.95+ and off by default in + 0.94.6+) + <property> <name>hbase.snapshot.enabled</name> <value>true</value> </property> -
-
Take a Snapshot - You can take a snapshot of a table regardless of whether it is enabled or disabled. - The snapshot operation doesn't involve any data copying. - - $ ./bin/hbase shell - hbase> snapshot 'myTable', 'myTableSnapshot-122112' - - +
+ Take a Snapshot + You can take a snapshot of a table regardless of whether it is enabled or disabled. The + snapshot operation doesn't involve any data copying. + +$ ./bin/hbase shell +hbase> snapshot 'myTable', 'myTableSnapshot-122112' +
-
Listing Snapshots - List all snapshots taken (by printing the names and relative information). - - $ ./bin/hbase shell - hbase> list_snapshots - - +
+ Listing Snapshots + List all snapshots taken (by printing the names and relative information). + +$ ./bin/hbase shell +hbase> list_snapshots +
-
Deleting Snapshots - You can remove a snapshot, and the files retained for that snapshot will be removed - if no longer needed. - - $ ./bin/hbase shell - hbase> delete_snapshot 'myTableSnapshot-122112' - - +
+ Deleting Snapshots + You can remove a snapshot, and the files retained for that snapshot will be removed if + no longer needed. + +$ ./bin/hbase shell +hbase> delete_snapshot 'myTableSnapshot-122112' +
-
Clone a table from snapshot - From a snapshot you can create a new table (clone operation) with the same data - that you had when the snapshot was taken. - The clone operation, doesn't involve data copies, and a change to the cloned table - doesn't impact the snapshot or the original table. - - $ ./bin/hbase shell - hbase> clone_snapshot 'myTableSnapshot-122112', 'myNewTestTable' - - +
+ Clone a table from snapshot + From a snapshot you can create a new table (clone operation) with the same data that you + had when the snapshot was taken. The clone operation, doesn't involve data copies, and a + change to the cloned table doesn't impact the snapshot or the original table. + +$ ./bin/hbase shell +hbase> clone_snapshot 'myTableSnapshot-122112', 'myNewTestTable' +
-
Restore a snapshot - The restore operation requires the table to be disabled, and the table will be - restored to the state at the time when the snapshot was taken, - changing both data and schema if required. - - $ ./bin/hbase shell - hbase> disable 'myTable' - hbase> restore_snapshot 'myTableSnapshot-122112' - - +
+ Restore a snapshot + The restore operation requires the table to be disabled, and the table will be restored + to the state at the time when the snapshot was taken, changing both data and schema if + required. + +$ ./bin/hbase shell +hbase> disable 'myTable' +hbase> restore_snapshot 'myTableSnapshot-122112' + - Since Replication works at log level and snapshots at file-system level, - after a restore, the replicas will be in a different state from the master. - If you want to use restore, you need to stop replication and redo the bootstrap. - + Since Replication works at log level and snapshots at file-system level, after a + restore, the replicas will be in a different state from the master. If you want to use + restore, you need to stop replication and redo the bootstrap. - In case of partial data-loss due to misbehaving client, instead of a full restore - that requires the table to be disabled, you can clone the table from the snapshot - and use a Map-Reduce job to copy the data that you need, from the clone to the main one. - + In case of partial data-loss due to misbehaving client, instead of a full restore that + requires the table to be disabled, you can clone the table from the snapshot and use a + Map-Reduce job to copy the data that you need, from the clone to the main one.
-
Snapshots operations and ACLs - If you are using security with the AccessController Coprocessor (See ), - only a global administrator can take, clone, or restore a snapshot, and these actions do not capture the ACL rights. - This means that restoring a table preserves the ACL rights of the existing table, - while cloning a table creates a new table that has no ACL rights until the administrator adds them. +
+ Snapshots operations and ACLs + If you are using security with the AccessController Coprocessor (See ), only a global administrator can take, + clone, or restore a snapshot, and these actions do not capture the ACL rights. This means + that restoring a table preserves the ACL rights of the existing table, while cloning a table + creates a new table that has no ACL rights until the administrator adds them.
-
Export to another cluster - The ExportSnapshot tool copies all the data related to a snapshot (hfiles, logs, snapshot metadata) to another cluster. - The tool executes a Map-Reduce job, similar to distcp, to copy files between the two clusters, - and since it works at file-system level the hbase cluster does not have to be online. - To copy a snapshot called MySnapshot to an HBase cluster srv2 (hdfs:///srv2:8082/hbase) using 16 mappers: -$ bin/hbase class org.apache.hadoop.hbase.snapshot.ExportSnapshot -snapshot MySnapshot -copy-to hdfs://srv2:8082/hbase -mappers 16 - - +
+ Export to another cluster
+ The ExportSnapshot tool copies all the data related to a snapshot (hfiles, logs,
+ snapshot metadata) to another cluster. The tool executes a Map-Reduce job, similar to
+ distcp, to copy files between the two clusters, and since it works at file-system level the
+ hbase cluster does not have to be online.
+ To copy a snapshot called MySnapshot to an HBase cluster srv2 (hdfs://srv2:8082/hbase)
+ using 16 mappers:
+ $ bin/hbase org.apache.hadoop.hbase.snapshot.ExportSnapshot -snapshot MySnapshot -copy-to hdfs://srv2:8082/hbase -mappers 16
-
+
+ -
Capacity Planning and Region Sizing - There are several considerations when planning the capacity for an HBase cluster and performing the initial configuration. Start with a solid understanding of how HBase handles data internally. -
Node count and hardware/VM configuration -
Physical data size
-Physical data size on disk is distinct from logical size of your data and is affected by the following:
-
-Increased by HBase overhead
-
-See and . At least 24 bytes per key-value (cell), can be more. Small keys/values means more relative overhead.
-KeyValue instances are aggregated into blocks, which are indexed. Indexes also have to be stored. Blocksize is configurable on a per-ColumnFamily basis. See .
-
-Decreased by compression and data block encoding, depending on data. See also this thread. You might want to test what compression and encoding (if any) make sense for your data.
-Increased by the size of the region server WAL (usually fixed and negligible - less than half of RS memory size, per RS).
-Increased by HDFS replication - usually x3.
-
-Aside from the disk space necessary to store the data, one RS may not be able to serve arbitrarily large amounts of data due to some practical limits on region count and size (see ).
-
Read/Write throughput
-Number of nodes can also be driven by required throughput for reads and/or writes. The throughput one can get per node depends a lot on data (esp. key/value sizes) and request patterns, as well as node and system configuration. Planning should be done for peak load if it is likely that the load would be the main driver of the increase of the node count. PerformanceEvaluation and tools can be used to test a single node or a test cluster.
-For writes, usually 5-15Mb/s per RS can be expected, since every region server has only one active WAL. There's no good estimate for reads, as it depends vastly on data, requests, and cache hit rate. might be helpful.
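+ A sketch of using PerformanceEvaluation, mentioned above, for a rough single-node write
+ test; the command name and client count follow the tool's usage output, and the optional
+ --nomapred flag runs the clients as local threads instead of a MapReduce job:
+ $ ./bin/hbase org.apache.hadoop.hbase.PerformanceEvaluation --nomapred sequentialWrite 1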
-
JVM GC limitations -RS cannot currently utilize very large heap due to cost of GC. There's also no good way of running multiple RS-es per server (other than running several VMs per machine). Thus, ~20-24Gb or less memory dedicated to one RS is recommended. GC tuning is required for large heap sizes. See , and elsewhere (TODO: where?) -
-
-
Determining region count and size -Generally less regions makes for a smoother running cluster (you can always manually split the big regions later (if necessary) to spread the data, or request load, over the cluster); 20-200 regions per RS is a reasonable range. The number of regions cannot be configured directly (unless you go for fully ); adjust the region size to achieve the target region size given table size. -When configuring regions for multiple tables, note that most region settings can be set on a per-table basis via HTableDescriptor, as well as shell commands. These settings will override the ones in hbase-site.xml. That is useful if your tables have different workloads/use cases. -Also note that in the discussion of region sizes here, HDFS replication factor is not (and should not be) taken into account, whereas other factors should be. So, if your data is compressed and replicated 3 ways by HDFS, "9 Gb region" means 9 Gb of compressed data. HDFS replication factor only affects your disk usage and is invisible to most HBase code. -
Number of regions per RS - upper bound -In production scenarios, where you have a lot of data, you are normally concerned with the maximum number of regions you can have per server. has technical discussion on the subject; in short, maximum number of regions is mostly determined by memstore memory usage. Each region has its own memstores; these grow up to a configurable size; usually in 128-256Mb range, see . There's one memstore per column family (so there's only one per region if there's one CF in the table). RS dedicates some fraction of total memory (see ) to region memstores. If this memory is exceeded (too much memstore usage), undesirable consequences such as unresponsive server, or later compaction storms, can result. Thus, a good starting point for the number of regions per RS (assuming one table) is (RS memory)*(total memstore fraction)/((memstore size)*(# column families)) -E.g. if RS has 16Gb RAM, with default settings, it is 16384*0.4/128 ~ 51 regions per RS is a starting point. The formula can be extended to multiple tables; if they all have the same configuration, just use total number of families. -This number can be adjusted; the formula above assumes all your regions are filled at approximately the same rate. If only a fraction of your regions are going to be actively written to, you can divide the result by that fraction to get a larger region count. Then, even if all regions are written to, all region memstores are not filled evenly, and eventually jitter appears even if they are (due to limited number of concurrent flushes). Thus, one can have as many as 2-3 times more regions than the starting point; however, increased numbers carry increased risk. -For write-heavy workload, memstore fraction can be increased in configuration at the expense of block cache; this will also allow one to have more regions. -
-
Number of regions per RS - lower bound -HBase scales by having regions across many servers. Thus if you have 2 regions for 16GB data, on a 20 node machine your data will be concentrated on just a few machines - nearly the entire cluster will be idle. This really can't be stressed enough, since a common problem is loading 200MB data into HBase and then wondering why your awesome 10 node cluster isn't doing anything. -On the other hand, if you have a very large amount of data, you may also want to go for a larger number of regions to avoid having regions that are too large. -
-
Maximum region size -For large tables in production scenarios, maximum region size is mostly limited by compactions - very large compactions, esp. major, can degrade cluster performance. Currently, the recommended maximum region size is 10-20Gb, and 5-10Gb is optimal. For older 0.90.x codebase, the upper-bound of regionsize is about 4Gb, with a default of 256Mb. -The size at which the region is split into two is generally configured via ; for details, see . -If you cannot estimate the size of your tables well, when starting off, it's probably best to stick to the default region size, perhaps going smaller for hot tables (or manually split hot regions to spread the load over the cluster), or go with larger region sizes if your cell sizes tend to be largish (100k and up). -In HBase 0.98, experimental stripe compactions feature was added that would allow for larger regions, especially for log data. See . -
-
Total data size per region server -According to above numbers for region size and number of regions per region server, in an optimistic estimate 10 GB x 100 regions per RS will give up to 1TB served per region server, which is in line with some of the reported multi-PB use cases. However, it is important to think about the data vs cache size ratio at the RS level. With 1TB of data per server and 10 GB block cache, only 1% of the data will be cached, which may barely cover all block indices. -
-
-
Initial configuration and tuning -First, see . Note that some configurations, more than others, depend on specific scenarios. Pay special attention to - - - request handler thread count, vital for high-throughput workloads. - - the blocking number of WAL files depends on your memstore configuration and should be set accordingly to prevent potential blocking when doing high volume of writes. - -Then, there are some considerations when setting up your cluster and tables. -
Compactions -Depending on read/write volume and latency requirements, optimal compaction settings may be different. See for some details. -When provisioning for large data sizes, however, it's good to keep in mind that compactions can affect write throughput. Thus, for write-intensive workloads, you may opt for less frequent compactions and more store files per regions. Minimum number of files for compactions (hbase.hstore.compaction.min) can be set to higher value; should also be increased, as more files might accumulate in such case. You may also consider manually managing compactions: -
-
Pre-splitting the table -Based on the target number of the regions per RS (see ) and number of RSes, one can pre-split the table at creation time. This would both avoid some costly splitting as the table starts to fill up, and ensure that the table starts out already distributed across many servers. -If the table is expected to grow large enough to justify that, at least one region per RS should be created. It is not recommended to split immediately into the full target number of regions (e.g. 50 * number of RSes), but a low intermediate value can be chosen. For multiple tables, it is recommended to be conservative with presplitting (e.g. pre-split 1 region per RS at most), especially if you don't know how much each table will grow. If you split too much, you may end up with too many regions, with some tables having too many small regions. -For pre-splitting howto, see . -
-
-
-
Table Rename - In versions 0.90.x of hbase and earlier, we had a simple script that would rename the hdfs - table directory and then do an edit of the .META. table replacing all mentions of the old - table name with the new. The script was called ./bin/rename_table.rb. - The script was deprecated and removed mostly because it was unmaintained and the operation - performed by the script was brutal. - - - As of hbase 0.94.x, you can use the snapshot facility renaming a table. Here is how you would -do it using the hbase shell: -hbase shell> disable 'tableName' +
+ Capacity Planning and Region Sizing + There are several considerations when planning the capacity for an HBase cluster and + performing the initial configuration. Start with a solid understanding of how HBase handles + data internally. +
+ Node count and hardware/VM configuration +
+ Physical data size + Physical data size on disk is distinct from logical size of your data and is affected + by the following: + + + Increased by HBase overhead + + + See and . At least 24 + bytes per key-value (cell), can be more. Small keys/values means more relative + overhead. + + + KeyValue instances are aggregated into blocks, which are indexed. Indexes also + have to be stored. Blocksize is configurable on a per-ColumnFamily basis. See + . + + + + + Decreased by and + data block encoding, depending on data. See also this thread. You might + want to test what compression and encoding (if any) make sense for your data. + + + Increased by size of region server + (usually fixed and negligible - less than half of RS memory size, per RS). + + + Increased by HDFS replication - usually x3. + + + Aside from the disk space necessary to store the data, one RS may not be able to serve + arbitrarily large amounts of data due to some practical limits on region count and size + (see ). +
+ +
+      Read/Write throughput
+      The number of nodes can also be driven by the required throughput for reads and/or writes. The
+      throughput one can get per node depends a lot on data (especially key/value sizes) and request
+      patterns, as well as node and system configuration. Planning should be done for peak load
+      if it is likely that the load would be the main driver of the increase of the node count.
+      PerformanceEvaluation and  tools can be
+      used to test a single node or a test cluster.
+      For writes, usually 5-15Mb/s per RS can be expected, since every region server has only
+      one active WAL. There's no good estimate for reads, as it depends vastly on data,
+      requests, and cache hit rate.  might be helpful.
+ +
+      JVM GC limitations
+      A RegionServer cannot currently utilize a very large heap due to the cost of GC. There is also no good
+      way of running multiple RSes per server (other than running several VMs per machine).
+      Thus, ~20-24Gb or less memory dedicated to one RS is recommended. GC tuning is required
+      for large heap sizes. See , and
+      elsewhere (TODO: where?)
+ +
+ +
+      Determining region count and size
+      Generally, fewer regions make for a smoother-running cluster (you can always manually
+      split the big regions later (if necessary) to spread the data, or request load, over the
+      cluster); 20-200 regions per RS is a reasonable range. The number of regions cannot be
+      configured directly (unless you go for fully ); adjust the region size to achieve the target
+      region count given the table size.
+      When configuring regions for multiple tables, note that most region settings can be set
+      on a per-table basis via HTableDescriptor, as well as by shell commands. These settings will override the ones
+      in hbase-site.xml. That is useful if your tables have different
+      workloads/use cases.
+      Also note that in the discussion of region sizes here, the HDFS
+      replication factor is not (and should not be) taken into account, whereas other factors
+      should be. So, if your data is compressed and replicated 3 ways by HDFS, "9 Gb region"
+      means 9 Gb of compressed data. The HDFS replication factor only affects your disk usage and is
+      invisible to most HBase code.
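      The following is a minimal sketch of adjusting region-related settings for a single table through
      HBaseAdmin and HTableDescriptor, mirroring the disable/modify/enable pattern used elsewhere in this
      guide; the table name and the chosen sizes are illustrative assumptions, not recommendations.
      <programlisting>
Configuration config = HBaseConfiguration.create();
HBaseAdmin admin = new HBaseAdmin(config);
byte[] table = Bytes.toBytes("my_table");          // hypothetical table name

admin.disableTable(table);
HTableDescriptor desc = admin.getTableDescriptor(table);
desc.setMaxFileSize(10L * 1024 * 1024 * 1024);     // split this table's regions at ~10 GB
desc.setMemStoreFlushSize(256L * 1024 * 1024);     // flush this table's memstores at 256 MB
admin.modifyTable(table, desc);
admin.enableTable(table);
      </programlisting>
      Settings applied this way live in the table descriptor, so they travel with the table rather than
      with hbase-site.xml.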
+      Number of regions per RS - upper bound
+      In production scenarios, where you have a lot of data, you are normally concerned with
+      the maximum number of regions you can have per server.  has technical discussion on the subject;
+      in short, the maximum number of regions is mostly determined by memstore memory usage.
+      Each region has its own memstores; these grow up to a configurable size, usually in the
+      128-256Mb range, see . There's one memstore per column family
+      (so there's only one per region if there's one CF in the table). The RS dedicates some
+      fraction of total memory (see )
+      to region memstores. If this memory is exceeded (too much memstore usage), undesirable
+      consequences such as an unresponsive server or, later, compaction storms can result. Thus, a
+      good starting point for the number of regions per RS (assuming one table) is:
+
+      (RS memory)*(total memstore fraction)/((memstore size)*(# column families))
+      E.g., if an RS has 16Gb RAM, then with default settings 16384*0.4/128 ~ 51 regions per
+      RS is a starting point. The formula can be extended to multiple tables; if they all have
+      the same configuration, just use the total number of families.
+      This number can be adjusted; the formula above assumes all your regions are filled at
+      approximately the same rate. If only a fraction of your regions are going to be actively
+      written to, you can divide the result by that fraction to get a larger region count. Then,
+      even if all regions are written to, all region memstores are not filled evenly, and
+      eventually jitter appears even if they are (due to the limited number of concurrent flushes).
+      Thus, one can have as many as 2-3 times more regions than the starting point; however,
+      increased numbers carry increased risk.
+      For write-heavy workloads, the memstore fraction can be increased in configuration at the
+      expense of block cache; this will also allow one to have more regions.
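      As a quick sanity check, the arithmetic above can be expressed directly; the values below are
      the illustrative defaults used in this section, not recommendations.
      <programlisting>
// starting point = (RS memory) * (memstore fraction) / ((memstore size) * (# column families))
double rsMemoryMb = 16 * 1024;        // 16 GB RegionServer heap, as in the example
double memstoreFraction = 0.4;        // default global memstore fraction
double memstoreSizeMb = 128;          // default memstore flush size, in MB
int columnFamilies = 1;               // one table with a single column family

double startingRegions = (rsMemoryMb * memstoreFraction) / (memstoreSizeMb * columnFamilies);
System.out.println(startingRegions);  // ~51, matching the worked example above
      </programlisting>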
+ +
+      Number of regions per RS - lower bound
+      HBase scales by having regions across many servers. Thus if you have 2 regions for
+      16GB of data on a 20-node cluster, your data will be concentrated on just a few machines -
+      nearly the entire cluster will be idle. This really can't be stressed enough, since a
+      common problem is loading 200MB of data into HBase and then wondering why your awesome
+      10-node cluster isn't doing anything.
+      On the other hand, if you have a very large amount of data, you may also want to go
+      for a larger number of regions to avoid having regions that are too large.
+ +
+      Maximum region size
+      For large tables in production scenarios, maximum region size is mostly limited by
+      compactions - very large compactions, especially major ones, can degrade cluster performance.
+      Currently, the recommended maximum region size is 10-20Gb, and 5-10Gb is optimal. For
+      the older 0.90.x codebase, the upper bound of region size is about 4Gb, with a default of
+      256Mb.
+      The size at which the region is split into two is generally configured via ; for details, see .
+      If you cannot estimate the size of your tables well, when starting off it's probably
+      best to stick to the default region size, perhaps going smaller for hot tables (or
+      manually splitting hot regions to spread the load over the cluster), or going with larger region
+      sizes if your cell sizes tend to be largish (100k and up).
+      In HBase 0.98, an experimental stripe compaction feature was added that allows for
+      larger regions, especially for log data. See .
+ +
+      Total data size per region server
+      According to the above numbers for region size and number of regions per region server,
+      an optimistic estimate of 10 GB x 100 regions per RS gives up to 1 TB served per region
+      server, which is in line with some of the reported multi-PB use cases. However, it is
+      important to think about the data-to-cache size ratio at the RS level. With 1 TB of data
+      per server and 10 GB of block cache, only 1% of the data will be cached, which may barely
+      cover all block indices.
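      The ratio in that example is easy to check; the numbers below are simply the ones from the text.
      <programlisting>
double dataPerServerGb = 10.0 * 100;   // 10 GB regions x 100 regions = ~1 TB per region server
double blockCacheGb = 10.0;            // example block cache size
double cachedFraction = blockCacheGb / dataPerServerGb;
System.out.println(cachedFraction);    // 0.01 -> only about 1% of the data fits in the cache
      </programlisting>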
+ +
+ +
+ Initial configuration and tuning + First, see . Note that some configurations, + more than others, depend on specific scenarios. Pay special attention to: + + + - request handler thread count, + vital for high-throughput workloads. + + + - the blocking number of WAL files depends on your + memstore configuration and should be set accordingly to prevent potential blocking when + doing high volume of writes. + + + Then, there are some considerations when setting up your cluster and tables. +
+      Compactions
+      Depending on read/write volume and latency requirements, optimal compaction settings
+      may be different. See  for some details.
+      When provisioning for large data sizes, however, it's good to keep in mind that
+      compactions can affect write throughput. Thus, for write-intensive workloads, you may opt
+      for less frequent compactions and more store files per region. The minimum number of files
+      for compactions (hbase.hstore.compaction.min) can be set to a higher
+      value;  should also be increased, as more
+      files might accumulate in that case. You may also consider manually managing compactions:
+
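      If you do take over compaction scheduling yourself (for example, by setting
      hbase.hregion.majorcompaction to 0 to disable periodic major compactions), major compactions can
      be requested explicitly from the client API during off-peak windows. A minimal sketch, with a
      hypothetical table name:
      <programlisting>
Configuration config = HBaseConfiguration.create();
HBaseAdmin admin = new HBaseAdmin(config);

// Request a major compaction on demand; the request is asynchronous and
// the method also accepts a single region name instead of a table name.
admin.majorCompact("my_table");
      </programlisting>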
+ +
+      Pre-splitting the table
+      Based on the target number of regions per RS (see ) and the number of RSes,
+      one can pre-split the table at creation time. This would both avoid some costly splitting
+      as the table starts to fill up, and ensure that the table starts out already distributed
+      across many servers.
+      If the table is expected to grow large enough to justify that, at least one region per
+      RS should be created. It is not recommended to split immediately into the full target
+      number of regions (e.g. 50 * number of RSes); rather, a low intermediate value can be chosen.
+      For multiple tables, it is recommended to be conservative with pre-splitting (e.g.
+      pre-split 1 region per RS at most), especially if you don't know how much each table will
+      grow. If you split too much, you may end up with too many regions, with some tables having
+      too many small regions.
+      For a pre-splitting how-to, see .
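      For illustration, a pre-split table can be created through the Java client as well as through the
      shell; in this sketch the table name, column family, and the ten-region split scheme over one-byte
      row prefixes are assumptions only.
      <programlisting>
Configuration config = HBaseConfiguration.create();
HBaseAdmin admin = new HBaseAdmin(config);

HTableDescriptor desc = new HTableDescriptor("my_table");   // hypothetical table
desc.addFamily(new HColumnDescriptor("fam"));

// Nine split points yield ten initial regions, evenly spaced over one-byte key prefixes.
byte[][] splits = new byte[9][];
for (int i = 1; i <= 9; i++) {
  splits[i - 1] = new byte[] { (byte) (i * 25) };
}
admin.createTable(desc, splits);
      </programlisting>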
+ +
+ +
+ +
+    Table Rename
+    In versions 0.90.x of hbase and earlier, we had a simple script that would rename the hdfs
+    table directory and then do an edit of the .META. table replacing all mentions of the old
+    table name with the new. The script was called ./bin/rename_table.rb. The
+    script was deprecated and removed mostly because it was unmaintained and the operation
+    performed by the script was brutal.
+    As of hbase 0.94.x, you can use the snapshot facility to rename a table. Here is how you
+    would do it using the hbase shell:
+    hbase shell> disable 'tableName'
hbase shell> snapshot 'tableName', 'tableSnapshot'
hbase shell> clone_snapshot 'tableSnapshot', 'newTableName'
hbase shell> delete_snapshot 'tableSnapshot'
hbase shell> drop 'tableName'
-or in code it would be as follows:
-void rename(HBaseAdmin admin, String oldTableName, String newTableName) {
- String snapshotName = randomName();
- admin.disableTable(oldTableName);
- admin.snapshot(snapshotName, oldTableName);
- admin.cloneSnapshot(snapshotName, newTableName);
- admin.deleteSnapshot(snapshotName);
- admin.deleteTable(oldTableName);
+    or in code it would be as follows:
+    void rename(HBaseAdmin admin, String oldTableName, String newTableName) {
+      String snapshotName = randomName();
+      admin.disableTable(oldTableName);
+      admin.snapshot(snapshotName, oldTableName);
+      admin.cloneSnapshot(snapshotName, newTableName);
+      admin.deleteSnapshot(snapshotName);
+      admin.deleteTable(oldTableName);
}
-
+
diff --git a/src/main/docbkx/performance.xml b/src/main/docbkx/performance.xml index 854e7c9fa1d..a56c52293f8 100644 --- a/src/main/docbkx/performance.xml +++ b/src/main/docbkx/performance.xml @@ -51,9 +51,9 @@ Important items to consider: - Switching capacity of the device - Number of systems connected - Uplink capacity + Switching capacity of the device + Number of systems connected + Uplink capacity
@@ -71,9 +71,9 @@ Mitigation of this issue is fairly simple and can be accomplished in multiple ways: - Use appropriate hardware for the scale of the cluster which you're attempting to build. - Use larger single switch configurations i.e. single 48 port as opposed to 2x 24 port - Configure port trunking for uplinks to utilize multiple interfaces to increase cross switch bandwidth. + Use appropriate hardware for the scale of the cluster which you're attempting to build. + Use larger single switch configurations i.e. single 48 port as opposed to 2x 24 port + Configure port trunking for uplinks to utilize multiple interfaces to increase cross switch bandwidth.
@@ -81,8 +81,8 @@
 Multiple Racks
 Multiple rack configurations carry the same potential issues as multiple switches, and can suffer performance degradation from two main areas:
- Poor switch capacity performance
- Insufficient uplink to another rack
+ Poor switch capacity performance
+ Insufficient uplink to another rack
 If the switches in your rack have appropriate switching capacity to handle all the hosts at full speed, the next most likely issue will be caused by homing more of your cluster across racks.
 The easiest way to avoid issues when spanning multiple racks is to use port trunking to create a bonded uplink to other racks.
diff --git a/src/main/docbkx/schema_design.xml b/src/main/docbkx/schema_design.xml
index 482d3d12a4c..a79f1754975 100644
--- a/src/main/docbkx/schema_design.xml
+++ b/src/main/docbkx/schema_design.xml
@@ -32,7 +32,7 @@
 the various non-rdbms datastores is Ian Varley's Master thesis, No Relation: The Mixed Blessings of Non-Relational Databases. Recommended. Also, read  for how HBase stores data internally, and the section on
- HBase Schema Design Case Studies.
+ .
@@ -41,7 +41,7 @@ <para>HBase schemas can be created or updated with <xref linkend="shell" /> or by using <link xlink:href="http://hbase.apache.org/apidocs/org/apache/hadoop/hbase/client/HBaseAdmin.html">HBaseAdmin</link> in the Java API. </para> - <para>Tables must be disabled when making ColumnFamily modifications, for example.. + <para>Tables must be disabled when making ColumnFamily modifications, for example:</para> <programlisting> Configuration config = HBaseConfiguration.create(); HBaseAdmin admin = new HBaseAdmin(conf); @@ -56,7 +56,7 @@ admin.modifyColumn(table, cf2); // modifying existing ColumnFamily admin.enableTable(table); </programlisting> - </para>See <xref linkend="client_dependencies"/> for more information about configuring client connections. + <para>See <xref linkend="client_dependencies"/> for more information about configuring client connections.</para> <para>Note: online schema changes are supported in the 0.92.x codebase, but the 0.90.x codebase requires the table to be disabled. </para> @@ -98,7 +98,7 @@ admin.enableTable(table); Monotonically Increasing Row Keys/Timeseries Data - In the HBase chapter of Tom White's book Hadoop: The Definitive Guide (O'Reilly) there is a an optimization note on watching out for a phenomenon where an import process walks in lock-step with all clients in concert pounding one of the table's regions (and thus, a single node), then moving onto the next region, etc. With monotonically increasing row-keys (i.e., using a timestamp), this will happen. See this comic by IKai Lan on why monotonically increasing row keys are problematic in BigTable-like datastores: + In the HBase chapter of Tom White's book Hadoop: The Definitive Guide (O'Reilly) there is a an optimization note on watching out for a phenomenon where an import process walks in lock-step with all clients in concert pounding one of the table's regions (and thus, a single node), then moving onto the next region, etc. With monotonically increasing row-keys (i.e., using a timestamp), this will happen. See this comic by IKai Lan on why monotonically increasing row keys are problematic in BigTable-like datastores: monotonically increasing values are bad. The pile-up on a single region brought on by monotonically increasing keys can be mitigated by randomizing the input records to not be in sorted order, but in general it's best to avoid using a timestamp or a sequence (e.g. 1, 2, 3) as the row-key. @@ -107,7 +107,7 @@ admin.enableTable(table); successful example. It has a page describing the schema it uses in HBase. The key format in OpenTSDB is effectively [metric_type][event_timestamp], which would appear at first glance to contradict the previous advice about not using a timestamp as the key. However, the difference is that the timestamp is not in the lead position of the key, and the design assumption is that there are dozens or hundreds (or more) of different metric types. Thus, even with a continual stream of input data with a mix of metric types, the Puts are distributed across various points of regions in the table. - See HBase Schema Design Case Studies for some rowkey design examples. + See for some rowkey design examples.
@@ -119,7 +119,7 @@ admin.enableTable(table);
 are large, especially compared to the size of the cell value, then you may run up against some interesting scenarios. One such is the case described by Marc Limotte at the tail of
- HBASE-3551
+ HBASE-3551
 (recommended!). Therein, the indices that are kept on HBase storefiles () to facilitate random access may end up occupying large chunks of the HBase
@@ -213,7 +213,7 @@ COLUMN CELL
 The most recent value for [key] in a table can be found by performing a Scan for [key] and obtaining the first record. Since HBase keys are in sorted order, this key sorts before any older row-keys for [key] and thus is first.
- This technique would be used instead of using HBase Versioning where the intent is to hold onto all versions
+ This technique would be used instead of using  where the intent is to hold onto all versions
 "forever" (or a very long time) and at the same time quickly obtain access to any other version by using the same Scan technique.
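      A minimal sketch of the reverse-timestamp technique described here; the table, key, column, and
      value names are illustrative assumptions only.
      <programlisting>
Configuration config = HBaseConfiguration.create();
HTable table = new HTable(config, "mytable");              // hypothetical table

// Write: append (Long.MAX_VALUE - timestamp) to the key so newer versions sort first.
byte[] key = Bytes.toBytes("somekey");
long reverseTs = Long.MAX_VALUE - System.currentTimeMillis();
Put put = new Put(Bytes.add(key, Bytes.toBytes(reverseTs)));
put.add(Bytes.toBytes("cf"), Bytes.toBytes("data"), Bytes.toBytes("value"));
table.put(put);

// Read: scan from the bare [key]; the first row returned is the most recent version for that key.
Scan scan = new Scan(key);
ResultScanner scanner = table.getScanner(scan);
Result newest = scanner.next();
scanner.close();
      </programlisting>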
@@ -335,11 +335,11 @@ public static byte[][] getHexSplits(String startKey, String endKey, int numRegio
 Result, so anything that can be converted to an array of bytes can be stored as a value. Input could be strings, numbers, complex objects, or even images as long as they can be rendered as bytes.
- There are practical limits to the size of values (e.g., storing 10-50MB objects in HBase
- would probably be too much to ask); search the mailing list for conversations on this topic.
- All rows in HBase conform to the datamodel, and that includes
- versioning. Take that into consideration when making your design, as well as block size for
- the ColumnFamily.
+ There are practical limits to the size of values (e.g., storing 10-50MB objects in HBase would probably be too much to ask);
+ search the mailing list for conversations on this topic. All rows in HBase conform to the , and
+ that includes versioning. Take that into consideration when making your design, as well as block size for the ColumnFamily.
+
+
Counters @@ -389,10 +389,10 @@ public static byte[][] getHexSplits(String startKey, String endKey, int numRegio There is no single answer on the best way to handle this because it depends on... - Number of users - Data size and data arrival rate - Flexibility of reporting requirements (e.g., completely ad-hoc date selection vs. pre-configured ranges) - Desired execution speed of query (e.g., 90 seconds may be reasonable to some for an ad-hoc report, whereas it may be too long for others) + Number of users + Data size and data arrival rate + Flexibility of reporting requirements (e.g., completely ad-hoc date selection vs. pre-configured ranges) + Desired execution speed of query (e.g., 90 seconds may be reasonable to some for an ad-hoc report, whereas it may be too long for others) ... and solutions are also influenced by the size of the cluster and how much processing power you have to throw at the solution. Common techniques are in sub-sections below. This is a comprehensive, but not exhaustive, list of approaches. @@ -455,26 +455,26 @@ public static byte[][] getHexSplits(String startKey, String endKey, int numRegio can be approached. Note: this is just an illustration of potential approaches, not an exhaustive list. Know your data, and know your processing requirements. - It is highly recommended that you read the rest of the Schema Design Chapter first, before reading + It is highly recommended that you read the rest of the first, before reading these case studies. Thee following case studies are described: - Log Data / Timeseries Data - Log Data / Timeseries on Steroids - Customer/Order - Tall/Wide/Middle Schema Design - List Data + Log Data / Timeseries Data + Log Data / Timeseries on Steroids + Customer/Order + Tall/Wide/Middle Schema Design + List Data
Case Study - Log Data and Timeseries Data Assume that the following data elements are being collected. - Hostname - Timestamp - Log event - Value/message + Hostname + Timestamp + Log event + Value/message We can store them in an HBase table called LOG_DATA, but what will the rowkey be? From these attributes the rowkey will be some combination of hostname, timestamp, and log-event - but what specifically? @@ -531,9 +531,9 @@ long bucket = timestamp % numBuckets; Composite Rowkey With Hashes: - [MD5 hash of hostname] = 16 bytes - [MD5 hash of event-type] = 16 bytes - [timestamp] = 8 bytes + [MD5 hash of hostname] = 16 bytes + [MD5 hash of event-type] = 16 bytes + [timestamp] = 8 bytes Composite Rowkey With Numeric Substitution: @@ -541,17 +541,17 @@ long bucket = timestamp % numBuckets; For this approach another lookup table would be needed in addition to LOG_DATA, called LOG_TYPES. The rowkey of LOG_TYPES would be: - [type] (e.g., byte indicating hostname vs. event-type) - [bytes] variable length bytes for raw hostname or event-type. + [type] (e.g., byte indicating hostname vs. event-type) + [bytes] variable length bytes for raw hostname or event-type. A column for this rowkey could be a long with an assigned number, which could be obtained by using an HBase counter. So the resulting composite rowkey would be: - [substituted long for hostname] = 8 bytes - [substituted long for event type] = 8 bytes - [timestamp] = 8 bytes + [substituted long for hostname] = 8 bytes + [substituted long for event type] = 8 bytes + [timestamp] = 8 bytes In either the Hash or Numeric substitution approach, the raw values for hostname and event-type can be stored as columns. @@ -586,19 +586,19 @@ long bucket = timestamp % numBuckets; The Customer record type would include all the things that you’d typically expect: - Customer number - Customer name - Address (e.g., city, state, zip) - Phone numbers, etc. + Customer number + Customer name + Address (e.g., city, state, zip) + Phone numbers, etc. The Order record type would include things like: - Customer number - Order number - Sales date - A series of nested objects for shipping locations and line-items (see - for details) + Customer number + Order number + Sales date + A series of nested objects for shipping locations and line-items (see + for details) Assuming that the combination of customer number and sales order uniquely identify an order, these two attributes will compose @@ -614,14 +614,14 @@ reasonable spread in the keyspace, similar options appear: Composite Rowkey With Hashes: - [MD5 of customer number] = 16 bytes - [MD5 of order number] = 16 bytes + [MD5 of customer number] = 16 bytes + [MD5 of order number] = 16 bytes Composite Numeric/Hash Combo Rowkey: - [substituted long for customer number] = 8 bytes - [MD5 of order number] = 16 bytes + [substituted long for customer number] = 8 bytes + [MD5 of order number] = 16 bytes
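      As a concrete illustration of the hash-based composite rowkeys sketched in these case studies, the
      following assembles the customer/order variant; the customer and order values, and the use of MD5,
      are illustrative assumptions.
      <programlisting>
MessageDigest md5 = MessageDigest.getInstance("MD5");     // from java.security
byte[] rowkey = Bytes.add(
    md5.digest(Bytes.toBytes("customer-12345")),          // [MD5 of customer number] = 16 bytes
    md5.digest(Bytes.toBytes("order-67890")));            // [MD5 of order number]    = 16 bytes
      </programlisting>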
@@ -631,15 +631,15 @@ reasonable spread in the keyspace, similar options appear: Customer Record Type Rowkey: - [customer-id] - [type] = type indicating ‘1’ for customer record type + [customer-id] + [type] = type indicating ‘1’ for customer record type Order Record Type Rowkey: - [customer-id] - [type] = type indicating ‘2’ for order record type - [order] + [customer-id] + [type] = type indicating ‘2’ for order record type + [order] The advantage of this particular CUSTOMER++ approach is that organizes many different record-types by customer-id @@ -665,23 +665,23 @@ reasonable spread in the keyspace, similar options appear: The SHIPPING_LOCATION's composite rowkey would be something like this: - [order-rowkey] - [shipping location number] (e.g., 1st location, 2nd, etc.) + [order-rowkey] + [shipping location number] (e.g., 1st location, 2nd, etc.) The LINE_ITEM table's composite rowkey would be something like this: - [order-rowkey] - [shipping location number] (e.g., 1st location, 2nd, etc.) - [line item number] (e.g., 1st lineitem, 2nd, etc.) + [order-rowkey] + [shipping location number] (e.g., 1st location, 2nd, etc.) + [line item number] (e.g., 1st lineitem, 2nd, etc.) Such a normalized model is likely to be the approach with an RDBMS, but that's not your only option with HBase. The cons of such an approach is that to retrieve information about any Order, you will need: - Get on the ORDER table for the Order - Scan on the SHIPPING_LOCATION table for that order to get the ShippingLocation instances - Scan on the LINE_ITEM for each ShippingLocation + Get on the ORDER table for the Order + Scan on the SHIPPING_LOCATION table for that order to get the ShippingLocation instances + Scan on the LINE_ITEM for each ShippingLocation ... granted, this is what an RDBMS would do under the covers anyway, but since there are no joins in HBase you're just more aware of this fact. @@ -693,23 +693,23 @@ reasonable spread in the keyspace, similar options appear: The Order rowkey was described above: - [order-rowkey] - [ORDER record type] + [order-rowkey] + [ORDER record type] The ShippingLocation composite rowkey would be something like this: - [order-rowkey] - [SHIPPING record type] - [shipping location number] (e.g., 1st location, 2nd, etc.) + [order-rowkey] + [SHIPPING record type] + [shipping location number] (e.g., 1st location, 2nd, etc.) The LineItem composite rowkey would be something like this: - [order-rowkey] - [LINE record type] - [shipping location number] (e.g., 1st location, 2nd, etc.) - [line item number] (e.g., 1st lineitem, 2nd, etc.) + [order-rowkey] + [LINE record type] + [shipping location number] (e.g., 1st location, 2nd, etc.) + [line item number] (e.g., 1st lineitem, 2nd, etc.)
@@ -720,21 +720,21 @@ reasonable spread in the keyspace, similar options appear: The LineItem composite rowkey would be something like this: - [order-rowkey] - [LINE record type] - [line item number] (e.g., 1st lineitem, 2nd, etc. - care must be taken that there are unique across the entire order) + [order-rowkey] + [LINE record type] + [line item number] (e.g., 1st lineitem, 2nd, etc. - care must be taken that there are unique across the entire order) ... and the LineItem columns would be something like this: - itemNumber - quantity - price - shipToLine1 (denormalized from ShippingLocation) - shipToLine2 (denormalized from ShippingLocation) - shipToCity (denormalized from ShippingLocation) - shipToState (denormalized from ShippingLocation) - shipToZip (denormalized from ShippingLocation) + itemNumber + quantity + price + shipToLine1 (denormalized from ShippingLocation) + shipToLine2 (denormalized from ShippingLocation) + shipToCity (denormalized from ShippingLocation) + shipToState (denormalized from ShippingLocation) + shipToZip (denormalized from ShippingLocation) The pros of this approach include a less complex object heirarchy, but one of the cons is that updating gets more @@ -789,7 +789,7 @@ reasonable spread in the keyspace, similar options appear: OpenTSDB is the best example of this case where a single row represents a defined time-range, and then discrete events are treated as columns. This approach is often more complex, and may require the additional complexity of re-writing your data, but has the advantage of being I/O efficient. For an overview of this approach, see - . + .
@@ -815,7 +815,7 @@ we could have something like: <FixedWidthUserName><FixedWidthValueId3>:"" (no value) -The other option we had was to do this entirely using: +The other option we had was to do this entirely using: <FixedWidthUserName><FixedWidthPageNum0>:<FixedWidthLength><FixedIdNextPageNum><ValueId1><ValueId2><ValueId3>... <FixedWidthUserName><FixedWidthPageNum1>:<FixedWidthLength><FixedIdNextPageNum><ValueId1><ValueId2><ValueId3>... @@ -827,8 +827,8 @@ So in one case reading the first thirty values would be: scan { STARTROW => 'FixedWidthUsername' LIMIT => 30} -And in the second case it would be - +And in the second case it would be + get 'FixedWidthUserName\x00\x00\x00\x00' diff --git a/src/main/docbkx/security.xml b/src/main/docbkx/security.xml index 47975228771..1bac920e455 100644 --- a/src/main/docbkx/security.xml +++ b/src/main/docbkx/security.xml @@ -517,7 +517,7 @@ You must configure HBase for secure or simple user access operation. Refer to the Secure Client Access to HBase or - Simple User Access to HBase + Simple User Access to HBase sections and complete all of the steps described there. @@ -779,14 +779,16 @@ Access control mechanisms are mature and fairly standardized in the relational d The HBase shell has been extended to provide simple commands for editing and updating user permissions. The following commands have been added for access control list management: - Grant - - + + + + Grant + grant <user|@group> <permissions> [ <table> [ <column family> [ <column qualifier> ] ] ] - - + + - <user|@group> is user or group (start with character '@'), Groups are created and manipulated via the Hadoop group mapping service. + <user|@group> is user or group (start with character '@'), Groups are created and manipulated via the Hadoop group mapping service. <permissions> is zero or more letters from the set "RWCA": READ('R'), WRITE('W'), CREATE('C'), ADMIN('A'). @@ -794,32 +796,32 @@ The HBase shell has been extended to provide simple commands for editing and upd Note: Grants and revocations of individual permissions on a resource are both accomplished using the grant command. A separate revoke command is also provided by the shell, but this is for fast revocation of all of a user's access rights to a given resource only. - - Revoke - - + + Revoke + revoke <user|@group> [ <table> [ <column family> [ <column qualifier> ] ] ] - + + + Alter + - Alter - - - The alter command has been extended to allow ownership assignment: + The alter command has been extended to allow ownership assignment: alter 'tablename', {OWNER => 'username|@group'} - + + + + User Permission + - User Permission - - - The user_permission command shows all access permissions for the current user for a given table: + The user_permission command shows all access permissions for the current user for a given table: user_permission <table> - +
@@ -829,12 +831,12 @@ The HBase shell has been extended to provide simple commands for editing and upd Bulk loading in secure mode is a bit more involved than normal setup, since the client has to transfer the ownership of the files generated from the mapreduce job to HBase. Secure bulk loading is implemented by a coprocessor, named SecureBulkLoadEndpoint. SecureBulkLoadEndpoint uses a staging directory "hbase.bulkload.staging.dir", which defaults to /tmp/hbase-staging/. The algorithm is as follows. - Create an hbase owned staging directory which is world traversable (-rwx--x--x, 711) /tmp/hbase-staging. - A user writes out data to his secure output directory: /user/foo/data - A call is made to hbase to create a secret staging directory - which is globally readable/writable (-rwxrwxrwx, 777): /tmp/hbase-staging/averylongandrandomdirectoryname - The user makes the data world readable and writable, then moves it - into the random staging directory, then calls bulkLoadHFiles() + Create an hbase owned staging directory which is world traversable (-rwx--x--x, 711) /tmp/hbase-staging. + A user writes out data to his secure output directory: /user/foo/data + A call is made to hbase to create a secret staging directory + which is globally readable/writable (-rwxrwxrwx, 777): /tmp/hbase-staging/averylongandrandomdirectoryname + The user makes the data world readable and writable, then moves it + into the random staging directory, then calls bulkLoadHFiles() @@ -870,9 +872,9 @@ The HBase shell has been extended to provide simple commands for editing and upd Visibility expressions like the above can be added when storing or mutating a cell using the API, - Mutation#setCellVisibility(new CellVisibility(String labelExpession)); - Where the labelExpression could be '( secret | topsecret ) & !probationary' - + Mutation#setCellVisibility(new CellVisibility(String labelExpession)); + Where the labelExpression could be '( secret | topsecret ) & !probationary' + We build the user's label set in the RPC context when a request is first received by the HBase RegionServer. How users are associated with labels is pluggable. The default plugin passes through labels specified in Authorizations added to the Get or Scan and checks those against the calling user's authenticated labels list. When client passes some labels for which the user is not authenticated, this default algorithm will drop those. One can pass a subset of user authenticated labels via the Scan/Get authorizations. @@ -896,7 +898,7 @@ The HBase shell has been extended to provide simple commands for editing and upd
-
+
User Label Association A set of labels can be associated with a user by using the API VisibilityClient#setAuths(Configuration conf, final String[] auths, final String user) diff --git a/src/main/docbkx/troubleshooting.xml b/src/main/docbkx/troubleshooting.xml index 7aebedaa99b..4c426d80ce9 100644 --- a/src/main/docbkx/troubleshooting.xml +++ b/src/main/docbkx/troubleshooting.xml @@ -235,7 +235,7 @@ export SERVER_GC_OPTS="$SERVER_GC_OPTS -XX:NewSize=64m -XX:MaxNewSize=64m" is generally used for questions on released versions of Apache HBase. Before going to the mailing list, make sure your question has not already been answered by searching the mailing list archives first. Use . - Take some time crafting your questionSee Getting Answers; a quality question that includes all context and + Take some time crafting your questionSee Getting Answers; a quality question that includes all context and exhibits evidence the author has tried to find answers in the manual and out on lists is more likely to get a prompt response. @@ -360,15 +360,15 @@ hadoop@sv4borg12:~$ jps In order, we see a: - Hadoop TaskTracker, manages the local Childs - HBase RegionServer, serves regions - Child, its MapReduce task, cannot tell which type exactly - Hadoop TaskTracker, manages the local Childs - Hadoop DataNode, serves blocks - HQuorumPeer, a ZooKeeper ensemble member - Jps, well… it’s the current process - ThriftServer, it’s a special one will be running only if thrift was started - jmx, this is a local process that’s part of our monitoring platform ( poorly named maybe). You probably don’t have that. + Hadoop TaskTracker, manages the local Childs + HBase RegionServer, serves regions + Child, its MapReduce task, cannot tell which type exactly + Hadoop TaskTracker, manages the local Childs + Hadoop DataNode, serves blocks + HQuorumPeer, a ZooKeeper ensemble member + Jps, well… it’s the current process + ThriftServer, it’s a special one will be running only if thrift was started + jmx, this is a local process that’s part of our monitoring platform ( poorly named maybe). You probably don’t have that. @@ -620,21 +620,19 @@ Harsh J investigated the issue as part of the mailing list thread
Client running out of memory though heap size seems to be stable (but the off-heap/direct heap keeps growing)
- You are likely running into the issue that is described and worked through in the
- mail thread HBase, mail # user - Suspected memory leak
- and continued over in HBase, mail # dev - FeedbackRe: Suspected memory leak. A workaround is passing
- your client-side JVM a reasonable value for -XX:MaxDirectMemorySize. By
- default, the MaxDirectMemorySize is equal to your -Xmx max
- heapsize setting (if -Xmx is set). Try seting it to something smaller (for
- example, one user had success setting it to 1g when they had a client-side heap
- of 12g). If you set it too small, it will bring on FullGCs so keep
- it a bit hefty. You want to make this setting client-side only especially if you are running
- the new experimental server-side off-heap cache since this feature depends on being able to
- use big direct buffers (You may have to keep separate client-side and server-side config
- dirs).
+
+You are likely running into the issue that is described and worked through in
+the mail thread HBase, mail # user - Suspected memory leak
+and continued over in HBase, mail # dev - FeedbackRe: Suspected memory leak.
+A workaround is passing your client-side JVM a reasonable value for -XX:MaxDirectMemorySize. By default,
+the MaxDirectMemorySize is equal to your -Xmx max heapsize setting (if -Xmx is set).
+Try setting it to something smaller (for example, one user had success setting it to 1g when
+they had a client-side heap of 12g). If you set it too small, it will bring on FullGCs so keep
+it a bit hefty. You want to make this setting client-side only, especially if you are running the new experimental
+server-side off-heap cache since this feature depends on being able to use big direct buffers (You may have to keep
+separate client-side and server-side config dirs).
+
+
Client Slowdown When Calling Admin Methods (flush, compact, etc.) @@ -753,7 +751,7 @@ Caused by: java.io.FileNotFoundException: File _partition.lst does not exist. /<HLog> (WAL HLog files for the RegionServer) - See the HDFS User Guide for other non-shell diagnostic + See the HDFS User Guide for other non-shell diagnostic utilities like fsck.
@@ -926,25 +924,26 @@ ERROR org.apache.hadoop.hbase.regionserver.HRegionServer: ZooKeeper session expi Since the RegionServer's local ZooKeeper client cannot send heartbeats, the session times out. By design, we shut down any node that isn't able to contact the ZooKeeper ensemble after getting a timeout so that it stops serving data that may already be assigned elsewhere. - + - Make sure you give plenty of RAM (in hbase-env.sh), the default of 1GB won't be able to sustain long running imports. - Make sure you don't swap, the JVM never behaves well under swapping. - Make sure you are not CPU starving the RegionServer thread. For example, if you are running a MapReduce job using 6 CPU-intensive tasks on a machine with 4 cores, you are probably starving the RegionServer enough to create longer garbage collection pauses. - Increase the ZooKeeper session timeout + Make sure you give plenty of RAM (in hbase-env.sh), the default of 1GB won't be able to sustain long running imports. + Make sure you don't swap, the JVM never behaves well under swapping. + Make sure you are not CPU starving the RegionServer thread. For example, if you are running a MapReduce job using 6 CPU-intensive tasks on a machine with 4 cores, you are probably starving the RegionServer enough to create longer garbage collection pauses. + Increase the ZooKeeper session timeout - If you wish to increase the session timeout, add the following to your hbase-site.xml to increase the timeout from the default of 60 seconds to 120 seconds. - -<property> - <name>zookeeper.session.timeout</name> - <value>1200000</value> -</property> -<property> - <name>hbase.zookeeper.property.tickTime</name> - <value>6000</value> -</property> + If you wish to increase the session timeout, add the following to your hbase-site.xml to increase the timeout from the default of 60 seconds to 120 seconds. + + + + zookeeper.session.timeout + 1200000 + + + hbase.zookeeper.property.tickTime + 6000 +]]> - + Be aware that setting a higher timeout means that the regions served by a failed RegionServer will take at least that amount of time to be transfered to another RegionServer. For a production system serving live requests, we would instead @@ -954,8 +953,8 @@ ERROR org.apache.hadoop.hbase.regionserver.HRegionServer: ZooKeeper session expi If this is happening during an upload which only happens once (like initially loading all your data into HBase), consider bulk loading. - See for other general information about ZooKeeper troubleshooting. -
+See for other general information about ZooKeeper troubleshooting. +
NotServingRegionException
 This exception is "normal" when found in the RegionServer logs at DEBUG level. This exception is returned back to the client
 and then the client goes back to .META. to find the new location of the moved region.
 However, if the NotServingRegionException is logged ERROR, then the client ran out of retries and something is probably wrong.
 RegionServer is not using the name given it by the master; double entry in master listing of servers for gory details.
-
+
Logs flooded with '2011-01-10 12:40:48,407 INFO org.apache.hadoop.io.compress.CodecPool: Got brand-new compressor' messages We are not using the native versions of compression @@ -992,7 +991,7 @@ ERROR org.apache.hadoop.hbase.regionserver.HRegionServer: ZooKeeper session expi
Shutdown Errors - +
@@ -1020,7 +1019,7 @@ ERROR org.apache.hadoop.hbase.regionserver.HRegionServer: ZooKeeper session expi
Shutdown Errors - +
diff --git a/src/main/docbkx/upgrading.xml b/src/main/docbkx/upgrading.xml index 7711614d21b..758d6d4317c 100644 --- a/src/main/docbkx/upgrading.xml +++ b/src/main/docbkx/upgrading.xml @@ -225,8 +225,8 @@ Now start up hbase-0.96.0.
-
Troubleshooting -
Old Client connecting to 0.96 cluster +
Troubleshooting +
Old Client connecting to 0.96 cluster It will fail with an exception like the below. Upgrade. 17:22:15 Exception in thread "main" java.lang.IllegalArgumentException: Not a host:port pair: PBUF 17:22:15 * @@ -266,20 +266,20 @@ If you've not patience, here are the important things to know upgrading. -Once you upgrade, you can’t go back. +Once you upgrade, you can’t go back. - -MSLAB is on by default. Watch that heap usage if you have a lot of regions. + +MSLAB is on by default. Watch that heap usage if you have a lot of regions. - + Distributed splitting is on by defaul. It should make region server failover faster. - - + + There’s a separate tarball for security. - - + + If -XX:MaxDirectMemorySize is set in your hbase-env.sh, it’s going to enable the experimental off-heap cache (You may not want this). - + @@ -301,7 +301,7 @@ This means you cannot go back to 0.90.x once you’ve started HBase 0.92.0 over In 0.92.0, the hbase.hregion.memstore.mslab.enabled flag is set to true (See ). In 0.90.x it was false. When it is enabled, memstores will step allocate memory in MSLAB 2MB chunks even if the memstore has zero or just a few small elements. This is fine usually but if you had lots of regions per regionserver in a 0.90.x cluster (and MSLAB was off), -you may find yourself OOME'ing on upgrade because the thousands of regions * number of column families * 2MB MSLAB (at a minimum) +you may find yourself OOME'ing on upgrade because the thousands of regions * number of column families * 2MB MSLAB (at a minimum) puts your heap over the top. Set hbase.hregion.memstore.mslab.enabled to false or set the MSLAB size down from 2MB by setting hbase.hregion.memstore.mslab.chunksize to something less. diff --git a/src/main/docbkx/zookeeper.xml b/src/main/docbkx/zookeeper.xml index 4a257b59452..d4d87749784 100644 --- a/src/main/docbkx/zookeeper.xml +++ b/src/main/docbkx/zookeeper.xml @@ -219,7 +219,7 @@ ${HBASE_HOME}/bin/hbase-daemons.sh {start,stop} zookeeper standalone Zookeeper quorum) for ease of learning. -
Operating System Prerequisites
+
Operating System Prerequisites You need to have a working Kerberos KDC setup. For @@ -283,7 +283,7 @@ ${HBASE_HOME}/bin/hbase-daemons.sh {start,stop} zookeeper We'll refer to this JAAS configuration file as $CLIENT_CONF below. - +
HBase-managed Zookeeper Configuration @@ -312,10 +312,10 @@ ${HBASE_HOME}/bin/hbase-daemons.sh {start,stop} zookeeper }; - where the $PATH_TO_HBASE_KEYTAB and + where the $PATH_TO_HBASE_KEYTAB and $PATH_TO_ZOOKEEPER_KEYTAB files are what you created above, and $HOST is the hostname for that - node. + node. The Server section will be used by the Zookeeper quorum server, while the @@ -342,9 +342,9 @@ ${HBASE_HOME}/bin/hbase-daemons.sh {start,stop} zookeeper export HBASE_REGIONSERVER_OPTS="-Djava.security.auth.login.config=$HBASE_SERVER_CONF" - where $HBASE_SERVER_CONF and + where $HBASE_SERVER_CONF and $CLIENT_CONF are the full paths to the - JAAS configuration files created above. + JAAS configuration files created above. Modify your hbase-site.xml on each node that will run zookeeper, master or regionserver to contain: @@ -537,10 +537,10 @@ ${HBASE_HOME}/bin/hbase-daemons.sh {start,stop} zookeeper
Configuration from Scratch - This has been tested on the current standard Amazon + This has been tested on the current standard Amazon Linux AMI. First setup KDC and principals as described above. Next checkout code and run a sanity - check. + check. git clone git://git.apache.org/hbase.git @@ -548,9 +548,9 @@ ${HBASE_HOME}/bin/hbase-daemons.sh {start,stop} zookeeper mvn clean test -Dtest=TestZooKeeperACL - Then configure HBase as described above. - Manually edit target/cached_classpath.txt (see below).. - + Then configure HBase as described above. + Manually edit target/cached_classpath.txt (see below): + bin/hbase zookeeper & bin/hbase master & @@ -582,14 +582,16 @@ ${HBASE_HOME}/bin/hbase-daemons.sh {start,stop} zookeeper programmatically - This would avoid the need for a separate Hadoop jar + This would avoid the need for a separate Hadoop jar that fixes HADOOP-7070. +
Elimination of <code>kerberos.removeHostFromPrincipal</code> and <code>kerberos.removeRealmFromPrincipal</code> +