HBASE-1699 Remove hbrep example as it's too out of date

git-svn-id: https://svn.apache.org/repos/asf/hadoop/hbase/trunk@797512 13f79535-47bb-0310-9956-ffa450edef68
2009-07-24 15:01:09 +00:00 · 2009-07-24 15:01:09 +00:00 · 3e7c6a6e4f
parent 926a17e351
commit 3e7c6a6e4f
15 changed files with 1 additions and 6735 deletions
--- a/CHANGES.txt
+++ b/CHANGES.txt
@ -508,6 +508,7 @@ Release 0.20.0 - Unreleased
   HBASE-1688  Improve javadocs in Result and KeyValue
   HBASE-1694  Add TOC to 'Getting Started', add references to THBase and
               ITHBase
+   HBASE-1699  Remove hbrep example as it's too out of date

  OPTIMIZATIONS
   HBASE-1412  Change values for delete column and column family in KeyValue
--- a/src/examples/uploaders/hbrep/HBaseConnection.py
+++ b/src/examples/uploaders/hbrep/HBaseConnection.py
@ -1,39 +0,0 @@
-import sys, os
-
-from Hbase.ttypes import *
-from Hbase import Hbase
-
-from thrift import Thrift
-from thrift.transport import TSocket, TTransport
-from thrift.protocol import TBinaryProtocol
-
-class HBaseConnection:
-  def __init__(self, hostname, port):
-    # Make socket
-    self.transport = TSocket.TSocket(hostname, port)
-    # Buffering is critical. Raw sockets are very slow
-    self.transport = TTransport.TBufferedTransport(self.transport)
-    # Wrap in a protocol
-    self.protocol = TBinaryProtocol.TBinaryProtocol(self.transport)
-    # Create a client to use the protocol encoder
-    self.client = Hbase.Client(self.protocol)
- 
-  def connect(self):  
-    self.transport.open()
-   
-  def disconnect(self):
-    self.transport.close()
-    
-  def validate_column_descriptors(self, table_name, column_descriptors):
-    hbase_families = self.client.getColumnDescriptors(table_name)
-    for col_desc in column_descriptors:
-      family, column = col_desc.split(":")
-      if not family in hbase_families:
-        raise Exception("Invalid column descriptor \"%s\" for hbase table \"%s\"" % (col_desc,table_name))
-      
-  def validate_table_name(self, table_name):
-    if not table_name in self.client.getTableNames():
-      raise Exception("hbase table '%s' not found." % (table_name))
-    
-  
-  
--- a/src/examples/uploaders/hbrep/HBaseConsumer.py
+++ b/src/examples/uploaders/hbrep/HBaseConsumer.py
@ -1,90 +0,0 @@
-import sys, os, pgq, skytools, ConfigParser
-
-from thrift import Thrift
-from thrift.transport import TSocket, TTransport
-from thrift.protocol import TBinaryProtocol
-
-from HBaseConnection import *
-import tablemapping
-
-INSERT = 'I'
-UPDATE = 'U'
-DELETE = 'D'
-
-class HBaseConsumer(pgq.Consumer):
-  """HBaseConsumer is a pgq.Consumer that sends processed events to hbase as mutations."""
-  
-  def __init__(self, service_name, args):
-    pgq.Consumer.__init__(self, service_name, "postgresql_db", args)
-    
-    config_file = self.args[0]
-    if len(self.args) < 2:
-      print "need table names"
-      sys.exit(1)
-    else:
-      self.table_names = self.args[1:]
-      
-    #just to check this option exists
-    self.cf.get("postgresql_db")
-    
-    self.max_batch_size = int(self.cf.get("max_batch_size", "10000"))
-    self.hbase_hostname = self.cf.get("hbase_hostname", "localhost")
-    self.hbase_port = int(self.cf.get("hbase_port", "9090"))
-    self.row_limit = int(self.cf.get("bootstrap_row_limit", 0))
-    self.table_mappings = tablemapping.load_table_mappings(config_file, self.table_names)
-  
-  def process_batch(self, source_db, batch_id, event_list):
-    try:
-      self.log.debug("processing batch %s" % (batch_id))
-      hbase = HBaseConnection(self.hbase_hostname, self.hbase_port)
-      try:
-        self.log.debug("Connecting to HBase")
-        hbase.connect()
-              
-        i = 0L
-        for event in event_list:
-          i = i+1
-          self.process_event(event, hbase)
-        print "%i events processed" % (i)
-        
-      except Exception, e:
-        #self.log.info(e)
-        sys.exit(e)
-      
-    finally:
-      hbase.disconnect()
-  
-  def process_event(self, event, hbase):
-    if event.ev_extra1 in self.table_mappings:
-      table_mapping = self.table_mappings[event.ev_extra1]
-    else:
-      self.log.info("table name not found in config, skipping event")
-      return
-    #hbase.validate_table_name(table_mapping.hbase_table_name)
-    #hbase.validate_column_descriptors(table_mapping.hbase_table_name, table_mapping.hbase_column_descriptors)
-    event_data = skytools.db_urldecode(event.data)
-    event_type = event.type.split(':')[0]
-    
-    batch = BatchMutation()
-    batch.row = table_mapping.hbase_row_prefix + str(event_data[table_mapping.psql_key_column])
-        
-    batch.mutations = []
-    for psql_column, hbase_column in zip(table_mapping.psql_columns, table_mapping.hbase_column_descriptors):
-      if event_type == INSERT or event_type == UPDATE:
-        m = Mutation()
-        m.column = hbase_column
-        m.value = str(event_data[psql_column])
-      elif event_type == DELETE:
-        # delete this column entry
-        m = Mutation()
-        m.isDelete = True
-        m.column = hbase_column
-      else:
-        raise Exception("Invalid event type: %s, event data was: %s" % (event_type, str(event_data)))
-      batch.mutations.append(m)
-    hbase.client.mutateRow(table_mapping.hbase_table_name, batch.row, batch.mutations)
-    event.tag_done()
-    
-if __name__ == '__main__':
-  script = HBaseConsumer("HBaseReplic",sys.argv[1:])
-  script.start()
--- a/src/examples/uploaders/hbrep/Hbase/Hbase-remote
+++ b/src/examples/uploaders/hbrep/Hbase/Hbase-remote
@ -1,247 +0,0 @@
-#!/usr/bin/env python
-#
-# Autogenerated by Thrift
-#
-# DO NOT EDIT UNLESS YOU ARE SURE THAT YOU KNOW WHAT YOU ARE DOING
-#
-
-import sys
-import pprint
-from urlparse import urlparse
-from thrift.transport import TTransport
-from thrift.transport import TSocket
-from thrift.transport import THttpClient
-from thrift.protocol import TBinaryProtocol
-
-import Hbase
-from ttypes import *
-
-if len(sys.argv) <= 1 or sys.argv[1] == '--help':
-  print ''
-  print 'Usage: ' + sys.argv[0] + ' [-h host:port] [-u url] [-f[ramed]] function [arg1 [arg2...]]'
-  print ''
-  print 'Functions:'
-  print '   getTableNames()'
-  print '   getColumnDescriptors(Text tableName)'
-  print '   getTableRegions(Text tableName)'
-  print '  void createTable(Text tableName,  columnFamilies)'
-  print '  void deleteTable(Text tableName)'
-  print '  Bytes get(Text tableName, Text row, Text column)'
-  print '   getVer(Text tableName, Text row, Text column, i32 numVersions)'
-  print '   getVerTs(Text tableName, Text row, Text column, i64 timestamp, i32 numVersions)'
-  print '   getRow(Text tableName, Text row)'
-  print '   getRowTs(Text tableName, Text row, i64 timestamp)'
-  print '  void put(Text tableName, Text row, Text column, Bytes value)'
-  print '  void mutateRow(Text tableName, Text row,  mutations)'
-  print '  void mutateRowTs(Text tableName, Text row,  mutations, i64 timestamp)'
-  print '  void mutateRows(Text tableName,  rowBatches)'
-  print '  void mutateRowsTs(Text tableName,  rowBatches, i64 timestamp)'
-  print '  void deleteAll(Text tableName, Text row, Text column)'
-  print '  void deleteAllTs(Text tableName, Text row, Text column, i64 timestamp)'
-  print '  void deleteAllRow(Text tableName, Text row)'
-  print '  void deleteAllRowTs(Text tableName, Text row, i64 timestamp)'
-  print '  ScannerID scannerOpen(Text tableName, Text startRow,  columns)'
-  print '  ScannerID scannerOpenWithStop(Text tableName, Text startRow, Text stopRow,  columns)'
-  print '  ScannerID scannerOpenTs(Text tableName, Text startRow,  columns, i64 timestamp)'
-  print '  ScannerID scannerOpenWithStopTs(Text tableName, Text startRow, Text stopRow,  columns, i64 timestamp)'
-  print '  ScanEntry scannerGet(ScannerID id)'
-  print '  void scannerClose(ScannerID id)'
-  print ''
-  sys.exit(0)
-
-pp = pprint.PrettyPrinter(indent = 2)
-host = 'localhost'
-port = 9090
-uri = ''
-framed = False
-http = False
-argi = 1
-
-if sys.argv[argi] == '-h':
-  parts = sys.argv[argi+1].split(':') 
-  host = parts[0]
-  port = int(parts[1])
-  argi += 2
-
-if sys.argv[argi] == '-u':
-  url = urlparse(sys.argv[argi+1])
-  parts = url[1].split(':') 
-  host = parts[0]
-  if len(parts) > 1:
-    port = int(parts[1])
-  else:
-    port = 80
-  uri = url[2]
-  http = True
-  argi += 2
-
-if sys.argv[argi] == '-f' or sys.argv[argi] == '-framed':
-  framed = True
-  argi += 1
-
-cmd = sys.argv[argi]
-args = sys.argv[argi+1:]
-
-if http:
-  transport = THttpClient.THttpClient(host, port, uri)
-else:
-  socket = TSocket.TSocket(host, port)
-  if framed:
-    transport = TTransport.TFramedTransport(socket)
-  else:
-    transport = TTransport.TBufferedTransport(socket)
-protocol = TBinaryProtocol.TBinaryProtocol(transport)
-client = Hbase.Client(protocol)
-transport.open()
-
-if cmd == 'getTableNames':
-  if len(args) != 0:
-    print 'getTableNames requires 0 args'
-    sys.exit(1)
-  pp.pprint(client.getTableNames())
-
-elif cmd == 'getColumnDescriptors':
-  if len(args) != 1:
-    print 'getColumnDescriptors requires 1 args'
-    sys.exit(1)
-  pp.pprint(client.getColumnDescriptors(eval(args[0]),))
-
-elif cmd == 'getTableRegions':
-  if len(args) != 1:
-    print 'getTableRegions requires 1 args'
-    sys.exit(1)
-  pp.pprint(client.getTableRegions(eval(args[0]),))
-
-elif cmd == 'createTable':
-  if len(args) != 2:
-    print 'createTable requires 2 args'
-    sys.exit(1)
-  pp.pprint(client.createTable(eval(args[0]),eval(args[1]),))
-
-elif cmd == 'deleteTable':
-  if len(args) != 1:
-    print 'deleteTable requires 1 args'
-    sys.exit(1)
-  pp.pprint(client.deleteTable(eval(args[0]),))
-
-elif cmd == 'get':
-  if len(args) != 3:
-    print 'get requires 3 args'
-    sys.exit(1)
-  pp.pprint(client.get(eval(args[0]),eval(args[1]),eval(args[2]),))
-
-elif cmd == 'getVer':
-  if len(args) != 4:
-    print 'getVer requires 4 args'
-    sys.exit(1)
-  pp.pprint(client.getVer(eval(args[0]),eval(args[1]),eval(args[2]),eval(args[3]),))
-
-elif cmd == 'getVerTs':
-  if len(args) != 5:
-    print 'getVerTs requires 5 args'
-    sys.exit(1)
-  pp.pprint(client.getVerTs(eval(args[0]),eval(args[1]),eval(args[2]),eval(args[3]),eval(args[4]),))
-
-elif cmd == 'getRow':
-  if len(args) != 2:
-    print 'getRow requires 2 args'
-    sys.exit(1)
-  pp.pprint(client.getRow(eval(args[0]),eval(args[1]),))
-
-elif cmd == 'getRowTs':
-  if len(args) != 3:
-    print 'getRowTs requires 3 args'
-    sys.exit(1)
-  pp.pprint(client.getRowTs(eval(args[0]),eval(args[1]),eval(args[2]),))
-
-elif cmd == 'put':
-  if len(args) != 4:
-    print 'put requires 4 args'
-    sys.exit(1)
-  pp.pprint(client.put(eval(args[0]),eval(args[1]),eval(args[2]),eval(args[3]),))
-
-elif cmd == 'mutateRow':
-  if len(args) != 3:
-    print 'mutateRow requires 3 args'
-    sys.exit(1)
-  pp.pprint(client.mutateRow(eval(args[0]),eval(args[1]),eval(args[2]),))
-
-elif cmd == 'mutateRowTs':
-  if len(args) != 4:
-    print 'mutateRowTs requires 4 args'
-    sys.exit(1)
-  pp.pprint(client.mutateRowTs(eval(args[0]),eval(args[1]),eval(args[2]),eval(args[3]),))
-
-elif cmd == 'mutateRows':
-  if len(args) != 2:
-    print 'mutateRows requires 2 args'
-    sys.exit(1)
-  pp.pprint(client.mutateRows(eval(args[0]),eval(args[1]),))
-
-elif cmd == 'mutateRowsTs':
-  if len(args) != 3:
-    print 'mutateRowsTs requires 3 args'
-    sys.exit(1)
-  pp.pprint(client.mutateRowsTs(eval(args[0]),eval(args[1]),eval(args[2]),))
-
-elif cmd == 'deleteAll':
-  if len(args) != 3:
-    print 'deleteAll requires 3 args'
-    sys.exit(1)
-  pp.pprint(client.deleteAll(eval(args[0]),eval(args[1]),eval(args[2]),))
-
-elif cmd == 'deleteAllTs':
-  if len(args) != 4:
-    print 'deleteAllTs requires 4 args'
-    sys.exit(1)
-  pp.pprint(client.deleteAllTs(eval(args[0]),eval(args[1]),eval(args[2]),eval(args[3]),))
-
-elif cmd == 'deleteAllRow':
-  if len(args) != 2:
-    print 'deleteAllRow requires 2 args'
-    sys.exit(1)
-  pp.pprint(client.deleteAllRow(eval(args[0]),eval(args[1]),))
-
-elif cmd == 'deleteAllRowTs':
-  if len(args) != 3:
-    print 'deleteAllRowTs requires 3 args'
-    sys.exit(1)
-  pp.pprint(client.deleteAllRowTs(eval(args[0]),eval(args[1]),eval(args[2]),))
-
-elif cmd == 'scannerOpen':
-  if len(args) != 3:
-    print 'scannerOpen requires 3 args'
-    sys.exit(1)
-  pp.pprint(client.scannerOpen(eval(args[0]),eval(args[1]),eval(args[2]),))
-
-elif cmd == 'scannerOpenWithStop':
-  if len(args) != 4:
-    print 'scannerOpenWithStop requires 4 args'
-    sys.exit(1)
-  pp.pprint(client.scannerOpenWithStop(eval(args[0]),eval(args[1]),eval(args[2]),eval(args[3]),))
-
-elif cmd == 'scannerOpenTs':
-  if len(args) != 4:
-    print 'scannerOpenTs requires 4 args'
-    sys.exit(1)
-  pp.pprint(client.scannerOpenTs(eval(args[0]),eval(args[1]),eval(args[2]),eval(args[3]),))
-
-elif cmd == 'scannerOpenWithStopTs':
-  if len(args) != 5:
-    print 'scannerOpenWithStopTs requires 5 args'
-    sys.exit(1)
-  pp.pprint(client.scannerOpenWithStopTs(eval(args[0]),eval(args[1]),eval(args[2]),eval(args[3]),eval(args[4]),))
-
-elif cmd == 'scannerGet':
-  if len(args) != 1:
-    print 'scannerGet requires 1 args'
-    sys.exit(1)
-  pp.pprint(client.scannerGet(eval(args[0]),))
-
-elif cmd == 'scannerClose':
-  if len(args) != 1:
-    print 'scannerClose requires 1 args'
-    sys.exit(1)
-  pp.pprint(client.scannerClose(eval(args[0]),))
-
-transport.close()
--- a/src/examples/uploaders/hbrep/Hbase/Hbase.py
+++ b/src/examples/uploaders/hbrep/Hbase/Hbase.py
--- a/src/examples/uploaders/hbrep/Hbase/init.py
+++ b/src/examples/uploaders/hbrep/Hbase/init.py
@ -1 +0,0 @@
-__all__ = ['ttypes', 'constants', 'Hbase']
--- a/src/examples/uploaders/hbrep/Hbase/constants.py
+++ b/src/examples/uploaders/hbrep/Hbase/constants.py
@ -1,9 +0,0 @@
-#
-# Autogenerated by Thrift
-#
-# DO NOT EDIT UNLESS YOU ARE SURE THAT YOU KNOW WHAT YOU ARE DOING
-#
-
-from thrift.Thrift import *
-from ttypes import *
-
--- a/src/examples/uploaders/hbrep/Hbase/ttypes.py
+++ b/src/examples/uploaders/hbrep/Hbase/ttypes.py
@ -1,708 +0,0 @@
-#
-# Autogenerated by Thrift
-#
-# DO NOT EDIT UNLESS YOU ARE SURE THAT YOU KNOW WHAT YOU ARE DOING
-#
-
-from thrift.Thrift import *
-
-from thrift.transport import TTransport
-from thrift.protocol import TBinaryProtocol
-try:
-  from thrift.protocol import fastbinary
-except:
-  fastbinary = None
-
-
-class ColumnDescriptor:
-
-  thrift_spec = (
-    None, # 0
-    (1, TType.STRING, 'name', None, None, ), # 1
-    (2, TType.I32, 'maxVersions', None, None, ), # 2
-    (3, TType.STRING, 'compression', None, None, ), # 3
-    (4, TType.BOOL, 'inMemory', None, None, ), # 4
-    (5, TType.I32, 'maxValueLength', None, None, ), # 5
-    (6, TType.STRING, 'bloomFilterType', None, None, ), # 6
-    (7, TType.I32, 'bloomFilterVectorSize', None, None, ), # 7
-    (8, TType.I32, 'bloomFilterNbHashes', None, None, ), # 8
-    (9, TType.BOOL, 'blockCacheEnabled', None, None, ), # 9
-    (10, TType.I32, 'timeToLive', None, None, ), # 10
-  )
-
-  def __init__(self, d=None):
-    self.name = None
-    self.maxVersions = 3
-    self.compression = 'NONE'
-    self.inMemory = False
-    self.maxValueLength = 2147483647
-    self.bloomFilterType = 'NONE'
-    self.bloomFilterVectorSize = 0
-    self.bloomFilterNbHashes = 0
-    self.blockCacheEnabled = False
-    self.timeToLive = -1
-    if isinstance(d, dict):
-      if 'name' in d:
-        self.name = d['name']
-      if 'maxVersions' in d:
-        self.maxVersions = d['maxVersions']
-      if 'compression' in d:
-        self.compression = d['compression']
-      if 'inMemory' in d:
-        self.inMemory = d['inMemory']
-      if 'maxValueLength' in d:
-        self.maxValueLength = d['maxValueLength']
-      if 'bloomFilterType' in d:
-        self.bloomFilterType = d['bloomFilterType']
-      if 'bloomFilterVectorSize' in d:
-        self.bloomFilterVectorSize = d['bloomFilterVectorSize']
-      if 'bloomFilterNbHashes' in d:
-        self.bloomFilterNbHashes = d['bloomFilterNbHashes']
-      if 'blockCacheEnabled' in d:
-        self.blockCacheEnabled = d['blockCacheEnabled']
-      if 'timeToLive' in d:
-        self.timeToLive = d['timeToLive']
-
-  def read(self, iprot):
-    if iprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and isinstance(iprot.trans, TTransport.CReadableTransport) and self.thrift_spec is not None and fastbinary is not None:
-      fastbinary.decode_binary(self, iprot.trans, (self.__class__, self.thrift_spec))
-      return
-    iprot.readStructBegin()
-    while True:
-      (fname, ftype, fid) = iprot.readFieldBegin()
-      if ftype == TType.STOP:
-        break
-      if fid == 1:
-        if ftype == TType.STRING:
-          self.name = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      elif fid == 2:
-        if ftype == TType.I32:
-          self.maxVersions = iprot.readI32();
-        else:
-          iprot.skip(ftype)
-      elif fid == 3:
-        if ftype == TType.STRING:
-          self.compression = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      elif fid == 4:
-        if ftype == TType.BOOL:
-          self.inMemory = iprot.readBool();
-        else:
-          iprot.skip(ftype)
-      elif fid == 5:
-        if ftype == TType.I32:
-          self.maxValueLength = iprot.readI32();
-        else:
-          iprot.skip(ftype)
-      elif fid == 6:
-        if ftype == TType.STRING:
-          self.bloomFilterType = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      elif fid == 7:
-        if ftype == TType.I32:
-          self.bloomFilterVectorSize = iprot.readI32();
-        else:
-          iprot.skip(ftype)
-      elif fid == 8:
-        if ftype == TType.I32:
-          self.bloomFilterNbHashes = iprot.readI32();
-        else:
-          iprot.skip(ftype)
-      elif fid == 9:
-        if ftype == TType.BOOL:
-          self.blockCacheEnabled = iprot.readBool();
-        else:
-          iprot.skip(ftype)
-      elif fid == 10:
-        if ftype == TType.I32:
-          self.timeToLive = iprot.readI32();
-        else:
-          iprot.skip(ftype)
-      else:
-        iprot.skip(ftype)
-      iprot.readFieldEnd()
-    iprot.readStructEnd()
-
-  def write(self, oprot):
-    if oprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and self.thrift_spec is not None and fastbinary is not None:
-      oprot.trans.write(fastbinary.encode_binary(self, (self.__class__, self.thrift_spec)))
-      return
-    oprot.writeStructBegin('ColumnDescriptor')
-    if self.name != None:
-      oprot.writeFieldBegin('name', TType.STRING, 1)
-      oprot.writeString(self.name)
-      oprot.writeFieldEnd()
-    if self.maxVersions != None:
-      oprot.writeFieldBegin('maxVersions', TType.I32, 2)
-      oprot.writeI32(self.maxVersions)
-      oprot.writeFieldEnd()
-    if self.compression != None:
-      oprot.writeFieldBegin('compression', TType.STRING, 3)
-      oprot.writeString(self.compression)
-      oprot.writeFieldEnd()
-    if self.inMemory != None:
-      oprot.writeFieldBegin('inMemory', TType.BOOL, 4)
-      oprot.writeBool(self.inMemory)
-      oprot.writeFieldEnd()
-    if self.maxValueLength != None:
-      oprot.writeFieldBegin('maxValueLength', TType.I32, 5)
-      oprot.writeI32(self.maxValueLength)
-      oprot.writeFieldEnd()
-    if self.bloomFilterType != None:
-      oprot.writeFieldBegin('bloomFilterType', TType.STRING, 6)
-      oprot.writeString(self.bloomFilterType)
-      oprot.writeFieldEnd()
-    if self.bloomFilterVectorSize != None:
-      oprot.writeFieldBegin('bloomFilterVectorSize', TType.I32, 7)
-      oprot.writeI32(self.bloomFilterVectorSize)
-      oprot.writeFieldEnd()
-    if self.bloomFilterNbHashes != None:
-      oprot.writeFieldBegin('bloomFilterNbHashes', TType.I32, 8)
-      oprot.writeI32(self.bloomFilterNbHashes)
-      oprot.writeFieldEnd()
-    if self.blockCacheEnabled != None:
-      oprot.writeFieldBegin('blockCacheEnabled', TType.BOOL, 9)
-      oprot.writeBool(self.blockCacheEnabled)
-      oprot.writeFieldEnd()
-    if self.timeToLive != None:
-      oprot.writeFieldBegin('timeToLive', TType.I32, 10)
-      oprot.writeI32(self.timeToLive)
-      oprot.writeFieldEnd()
-    oprot.writeFieldStop()
-    oprot.writeStructEnd()
-
-  def __str__(self): 
-    return str(self.__dict__)
-
-  def __repr__(self): 
-    return repr(self.__dict__)
-
-  def __eq__(self, other):
-    return isinstance(other, self.__class__) and self.__dict__ == other.__dict__
-
-  def __ne__(self, other):
-    return not (self == other)
-
-class RegionDescriptor:
-
-  thrift_spec = (
-    None, # 0
-    (1, TType.STRING, 'startKey', None, None, ), # 1
-  )
-
-  def __init__(self, d=None):
-    self.startKey = None
-    if isinstance(d, dict):
-      if 'startKey' in d:
-        self.startKey = d['startKey']
-
-  def read(self, iprot):
-    if iprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and isinstance(iprot.trans, TTransport.CReadableTransport) and self.thrift_spec is not None and fastbinary is not None:
-      fastbinary.decode_binary(self, iprot.trans, (self.__class__, self.thrift_spec))
-      return
-    iprot.readStructBegin()
-    while True:
-      (fname, ftype, fid) = iprot.readFieldBegin()
-      if ftype == TType.STOP:
-        break
-      if fid == 1:
-        if ftype == TType.STRING:
-          self.startKey = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      else:
-        iprot.skip(ftype)
-      iprot.readFieldEnd()
-    iprot.readStructEnd()
-
-  def write(self, oprot):
-    if oprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and self.thrift_spec is not None and fastbinary is not None:
-      oprot.trans.write(fastbinary.encode_binary(self, (self.__class__, self.thrift_spec)))
-      return
-    oprot.writeStructBegin('RegionDescriptor')
-    if self.startKey != None:
-      oprot.writeFieldBegin('startKey', TType.STRING, 1)
-      oprot.writeString(self.startKey)
-      oprot.writeFieldEnd()
-    oprot.writeFieldStop()
-    oprot.writeStructEnd()
-
-  def __str__(self): 
-    return str(self.__dict__)
-
-  def __repr__(self): 
-    return repr(self.__dict__)
-
-  def __eq__(self, other):
-    return isinstance(other, self.__class__) and self.__dict__ == other.__dict__
-
-  def __ne__(self, other):
-    return not (self == other)
-
-class Mutation:
-
-  thrift_spec = (
-    None, # 0
-    (1, TType.BOOL, 'isDelete', None, None, ), # 1
-    (2, TType.STRING, 'column', None, None, ), # 2
-    (3, TType.STRING, 'value', None, None, ), # 3
-  )
-
-  def __init__(self, d=None):
-    self.isDelete = False
-    self.column = None
-    self.value = None
-    if isinstance(d, dict):
-      if 'isDelete' in d:
-        self.isDelete = d['isDelete']
-      if 'column' in d:
-        self.column = d['column']
-      if 'value' in d:
-        self.value = d['value']
-
-  def read(self, iprot):
-    if iprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and isinstance(iprot.trans, TTransport.CReadableTransport) and self.thrift_spec is not None and fastbinary is not None:
-      fastbinary.decode_binary(self, iprot.trans, (self.__class__, self.thrift_spec))
-      return
-    iprot.readStructBegin()
-    while True:
-      (fname, ftype, fid) = iprot.readFieldBegin()
-      if ftype == TType.STOP:
-        break
-      if fid == 1:
-        if ftype == TType.BOOL:
-          self.isDelete = iprot.readBool();
-        else:
-          iprot.skip(ftype)
-      elif fid == 2:
-        if ftype == TType.STRING:
-          self.column = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      elif fid == 3:
-        if ftype == TType.STRING:
-          self.value = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      else:
-        iprot.skip(ftype)
-      iprot.readFieldEnd()
-    iprot.readStructEnd()
-
-  def write(self, oprot):
-    if oprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and self.thrift_spec is not None and fastbinary is not None:
-      oprot.trans.write(fastbinary.encode_binary(self, (self.__class__, self.thrift_spec)))
-      return
-    oprot.writeStructBegin('Mutation')
-    if self.isDelete != None:
-      oprot.writeFieldBegin('isDelete', TType.BOOL, 1)
-      oprot.writeBool(self.isDelete)
-      oprot.writeFieldEnd()
-    if self.column != None:
-      oprot.writeFieldBegin('column', TType.STRING, 2)
-      oprot.writeString(self.column)
-      oprot.writeFieldEnd()
-    if self.value != None:
-      oprot.writeFieldBegin('value', TType.STRING, 3)
-      oprot.writeString(self.value)
-      oprot.writeFieldEnd()
-    oprot.writeFieldStop()
-    oprot.writeStructEnd()
-
-  def __str__(self): 
-    return str(self.__dict__)
-
-  def __repr__(self): 
-    return repr(self.__dict__)
-
-  def __eq__(self, other):
-    return isinstance(other, self.__class__) and self.__dict__ == other.__dict__
-
-  def __ne__(self, other):
-    return not (self == other)
-
-class BatchMutation:
-
-  thrift_spec = (
-    None, # 0
-    (1, TType.STRING, 'row', None, None, ), # 1
-    (2, TType.LIST, 'mutations', (TType.STRUCT,(Mutation, Mutation.thrift_spec)), None, ), # 2
-  )
-
-  def __init__(self, d=None):
-    self.row = None
-    self.mutations = None
-    if isinstance(d, dict):
-      if 'row' in d:
-        self.row = d['row']
-      if 'mutations' in d:
-        self.mutations = d['mutations']
-
-  def read(self, iprot):
-    if iprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and isinstance(iprot.trans, TTransport.CReadableTransport) and self.thrift_spec is not None and fastbinary is not None:
-      fastbinary.decode_binary(self, iprot.trans, (self.__class__, self.thrift_spec))
-      return
-    iprot.readStructBegin()
-    while True:
-      (fname, ftype, fid) = iprot.readFieldBegin()
-      if ftype == TType.STOP:
-        break
-      if fid == 1:
-        if ftype == TType.STRING:
-          self.row = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      elif fid == 2:
-        if ftype == TType.LIST:
-          self.mutations = []
-          (_etype3, _size0) = iprot.readListBegin()
-          for _i4 in xrange(_size0):
-            _elem5 = Mutation()
-            _elem5.read(iprot)
-            self.mutations.append(_elem5)
-          iprot.readListEnd()
-        else:
-          iprot.skip(ftype)
-      else:
-        iprot.skip(ftype)
-      iprot.readFieldEnd()
-    iprot.readStructEnd()
-
-  def write(self, oprot):
-    if oprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and self.thrift_spec is not None and fastbinary is not None:
-      oprot.trans.write(fastbinary.encode_binary(self, (self.__class__, self.thrift_spec)))
-      return
-    oprot.writeStructBegin('BatchMutation')
-    if self.row != None:
-      oprot.writeFieldBegin('row', TType.STRING, 1)
-      oprot.writeString(self.row)
-      oprot.writeFieldEnd()
-    if self.mutations != None:
-      oprot.writeFieldBegin('mutations', TType.LIST, 2)
-      oprot.writeListBegin(TType.STRUCT, len(self.mutations))
-      for iter6 in self.mutations:
-        iter6.write(oprot)
-      oprot.writeListEnd()
-      oprot.writeFieldEnd()
-    oprot.writeFieldStop()
-    oprot.writeStructEnd()
-
-  def __str__(self): 
-    return str(self.__dict__)
-
-  def __repr__(self): 
-    return repr(self.__dict__)
-
-  def __eq__(self, other):
-    return isinstance(other, self.__class__) and self.__dict__ == other.__dict__
-
-  def __ne__(self, other):
-    return not (self == other)
-
-class ScanEntry:
-
-  thrift_spec = (
-    None, # 0
-    (1, TType.STRING, 'row', None, None, ), # 1
-    (2, TType.MAP, 'columns', (TType.STRING,None,TType.STRING,None), None, ), # 2
-  )
-
-  def __init__(self, d=None):
-    self.row = None
-    self.columns = None
-    if isinstance(d, dict):
-      if 'row' in d:
-        self.row = d['row']
-      if 'columns' in d:
-        self.columns = d['columns']
-
-  def read(self, iprot):
-    if iprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and isinstance(iprot.trans, TTransport.CReadableTransport) and self.thrift_spec is not None and fastbinary is not None:
-      fastbinary.decode_binary(self, iprot.trans, (self.__class__, self.thrift_spec))
-      return
-    iprot.readStructBegin()
-    while True:
-      (fname, ftype, fid) = iprot.readFieldBegin()
-      if ftype == TType.STOP:
-        break
-      if fid == 1:
-        if ftype == TType.STRING:
-          self.row = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      elif fid == 2:
-        if ftype == TType.MAP:
-          self.columns = {}
-          (_ktype8, _vtype9, _size7 ) = iprot.readMapBegin() 
-          for _i11 in xrange(_size7):
-            _key12 = iprot.readString();
-            _val13 = iprot.readString();
-            self.columns[_key12] = _val13
-          iprot.readMapEnd()
-        else:
-          iprot.skip(ftype)
-      else:
-        iprot.skip(ftype)
-      iprot.readFieldEnd()
-    iprot.readStructEnd()
-
-  def write(self, oprot):
-    if oprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and self.thrift_spec is not None and fastbinary is not None:
-      oprot.trans.write(fastbinary.encode_binary(self, (self.__class__, self.thrift_spec)))
-      return
-    oprot.writeStructBegin('ScanEntry')
-    if self.row != None:
-      oprot.writeFieldBegin('row', TType.STRING, 1)
-      oprot.writeString(self.row)
-      oprot.writeFieldEnd()
-    if self.columns != None:
-      oprot.writeFieldBegin('columns', TType.MAP, 2)
-      oprot.writeMapBegin(TType.STRING, TType.STRING, len(self.columns))
-      for kiter14,viter15 in self.columns.items():
-        oprot.writeString(kiter14)
-        oprot.writeString(viter15)
-      oprot.writeMapEnd()
-      oprot.writeFieldEnd()
-    oprot.writeFieldStop()
-    oprot.writeStructEnd()
-
-  def __str__(self): 
-    return str(self.__dict__)
-
-  def __repr__(self): 
-    return repr(self.__dict__)
-
-  def __eq__(self, other):
-    return isinstance(other, self.__class__) and self.__dict__ == other.__dict__
-
-  def __ne__(self, other):
-    return not (self == other)
-
-class IOError(Exception):
-
-  thrift_spec = (
-    None, # 0
-    (1, TType.STRING, 'message', None, None, ), # 1
-  )
-
-  def __init__(self, d=None):
-    self.message = None
-    if isinstance(d, dict):
-      if 'message' in d:
-        self.message = d['message']
-
-  def read(self, iprot):
-    if iprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and isinstance(iprot.trans, TTransport.CReadableTransport) and self.thrift_spec is not None and fastbinary is not None:
-      fastbinary.decode_binary(self, iprot.trans, (self.__class__, self.thrift_spec))
-      return
-    iprot.readStructBegin()
-    while True:
-      (fname, ftype, fid) = iprot.readFieldBegin()
-      if ftype == TType.STOP:
-        break
-      if fid == 1:
-        if ftype == TType.STRING:
-          self.message = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      else:
-        iprot.skip(ftype)
-      iprot.readFieldEnd()
-    iprot.readStructEnd()
-
-  def write(self, oprot):
-    if oprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and self.thrift_spec is not None and fastbinary is not None:
-      oprot.trans.write(fastbinary.encode_binary(self, (self.__class__, self.thrift_spec)))
-      return
-    oprot.writeStructBegin('IOError')
-    if self.message != None:
-      oprot.writeFieldBegin('message', TType.STRING, 1)
-      oprot.writeString(self.message)
-      oprot.writeFieldEnd()
-    oprot.writeFieldStop()
-    oprot.writeStructEnd()
-
-  def __str__(self): 
-    return str(self.__dict__)
-
-  def __repr__(self): 
-    return repr(self.__dict__)
-
-  def __eq__(self, other):
-    return isinstance(other, self.__class__) and self.__dict__ == other.__dict__
-
-  def __ne__(self, other):
-    return not (self == other)
-
-class IllegalArgument(Exception):
-
-  thrift_spec = (
-    None, # 0
-    (1, TType.STRING, 'message', None, None, ), # 1
-  )
-
-  def __init__(self, d=None):
-    self.message = None
-    if isinstance(d, dict):
-      if 'message' in d:
-        self.message = d['message']
-
-  def read(self, iprot):
-    if iprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and isinstance(iprot.trans, TTransport.CReadableTransport) and self.thrift_spec is not None and fastbinary is not None:
-      fastbinary.decode_binary(self, iprot.trans, (self.__class__, self.thrift_spec))
-      return
-    iprot.readStructBegin()
-    while True:
-      (fname, ftype, fid) = iprot.readFieldBegin()
-      if ftype == TType.STOP:
-        break
-      if fid == 1:
-        if ftype == TType.STRING:
-          self.message = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      else:
-        iprot.skip(ftype)
-      iprot.readFieldEnd()
-    iprot.readStructEnd()
-
-  def write(self, oprot):
-    if oprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and self.thrift_spec is not None and fastbinary is not None:
-      oprot.trans.write(fastbinary.encode_binary(self, (self.__class__, self.thrift_spec)))
-      return
-    oprot.writeStructBegin('IllegalArgument')
-    if self.message != None:
-      oprot.writeFieldBegin('message', TType.STRING, 1)
-      oprot.writeString(self.message)
-      oprot.writeFieldEnd()
-    oprot.writeFieldStop()
-    oprot.writeStructEnd()
-
-  def __str__(self): 
-    return str(self.__dict__)
-
-  def __repr__(self): 
-    return repr(self.__dict__)
-
-  def __eq__(self, other):
-    return isinstance(other, self.__class__) and self.__dict__ == other.__dict__
-
-  def __ne__(self, other):
-    return not (self == other)
-
-class NotFound(Exception):
-
-  thrift_spec = (
-    None, # 0
-    (1, TType.STRING, 'message', None, None, ), # 1
-  )
-
-  def __init__(self, d=None):
-    self.message = None
-    if isinstance(d, dict):
-      if 'message' in d:
-        self.message = d['message']
-
-  def read(self, iprot):
-    if iprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and isinstance(iprot.trans, TTransport.CReadableTransport) and self.thrift_spec is not None and fastbinary is not None:
-      fastbinary.decode_binary(self, iprot.trans, (self.__class__, self.thrift_spec))
-      return
-    iprot.readStructBegin()
-    while True:
-      (fname, ftype, fid) = iprot.readFieldBegin()
-      if ftype == TType.STOP:
-        break
-      if fid == 1:
-        if ftype == TType.STRING:
-          self.message = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      else:
-        iprot.skip(ftype)
-      iprot.readFieldEnd()
-    iprot.readStructEnd()
-
-  def write(self, oprot):
-    if oprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and self.thrift_spec is not None and fastbinary is not None:
-      oprot.trans.write(fastbinary.encode_binary(self, (self.__class__, self.thrift_spec)))
-      return
-    oprot.writeStructBegin('NotFound')
-    if self.message != None:
-      oprot.writeFieldBegin('message', TType.STRING, 1)
-      oprot.writeString(self.message)
-      oprot.writeFieldEnd()
-    oprot.writeFieldStop()
-    oprot.writeStructEnd()
-
-  def __str__(self): 
-    return str(self.__dict__)
-
-  def __repr__(self): 
-    return repr(self.__dict__)
-
-  def __eq__(self, other):
-    return isinstance(other, self.__class__) and self.__dict__ == other.__dict__
-
-  def __ne__(self, other):
-    return not (self == other)
-
-class AlreadyExists(Exception):
-
-  thrift_spec = (
-    None, # 0
-    (1, TType.STRING, 'message', None, None, ), # 1
-  )
-
-  def __init__(self, d=None):
-    self.message = None
-    if isinstance(d, dict):
-      if 'message' in d:
-        self.message = d['message']
-
-  def read(self, iprot):
-    if iprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and isinstance(iprot.trans, TTransport.CReadableTransport) and self.thrift_spec is not None and fastbinary is not None:
-      fastbinary.decode_binary(self, iprot.trans, (self.__class__, self.thrift_spec))
-      return
-    iprot.readStructBegin()
-    while True:
-      (fname, ftype, fid) = iprot.readFieldBegin()
-      if ftype == TType.STOP:
-        break
-      if fid == 1:
-        if ftype == TType.STRING:
-          self.message = iprot.readString();
-        else:
-          iprot.skip(ftype)
-      else:
-        iprot.skip(ftype)
-      iprot.readFieldEnd()
-    iprot.readStructEnd()
-
-  def write(self, oprot):
-    if oprot.__class__ == TBinaryProtocol.TBinaryProtocolAccelerated and self.thrift_spec is not None and fastbinary is not None:
-      oprot.trans.write(fastbinary.encode_binary(self, (self.__class__, self.thrift_spec)))
-      return
-    oprot.writeStructBegin('AlreadyExists')
-    if self.message != None:
-      oprot.writeFieldBegin('message', TType.STRING, 1)
-      oprot.writeString(self.message)
-      oprot.writeFieldEnd()
-    oprot.writeFieldStop()
-    oprot.writeStructEnd()
-
-  def __str__(self): 
-    return str(self.__dict__)
-
-  def __repr__(self): 
-    return repr(self.__dict__)
-
-  def __eq__(self, other):
-    return isinstance(other, self.__class__) and self.__dict__ == other.__dict__
-
-  def __ne__(self, other):
-    return not (self == other)
-
--- a/src/examples/uploaders/hbrep/README
+++ b/src/examples/uploaders/hbrep/README
@ -1,107 +0,0 @@
-hbrep is a tool for replicating data from postgresql tables to hbase tables.
-
-Dependancies:
- - python 2.4
- - hbase 0.2.0
- - skytools 2.1.7
- - postgresql
- 
-It has two main functions.
- - bootstrap, which bootstraps all the data from specified columns of a table
- - play, which processes incoming insert, update and delete events and applies them to hbase.
-
-Example usage:
-install triggers:
-  ./hbrep.py hbrep.ini install schema1.table1 schema2.table2
-now that future updates are queuing, bootstrap the tables.
-  ./hbrep.py hbrep.ini bootstrap schema1.table1 schema2.table2
-start pgq ticker
-  pgqadm.py pgq.ini ticker
-play our queue consumer
-  ./hbrep.py hbrep.ini play schema1.table1 schema2.table2
-
-
-More details follow.
-
-
-All functions require an ini file (say hbrep.ini) with a HBaseReplic section, and a section for each postgresql table you wish to replicate containing the table mapping. Note the table mapping section names should match the name of the postgresql table.
-
-eg. ini file:
-####################
-[HBaseReplic]
-job_name = hbase_replic_job
-logfile = %(job_name)s.log
-pidfile = %(job_name)s.pid
-postgresql_db = dbname=source_database user=dbuser
-pgq_queue_name = hbase_replic_queue
-hbase_hostname = localhost
-hbase_port = 9090
-# If omitted, default is 10000
-max_batch_size = 10000
-# file to use when copying a table, if omitted a select columns will be done instead.
-bootstrap_tmpfile = tabledump.dat
-
-# For each table mapping, there must be the same number psql_columns as hbase_column_descriptors
-[public.users]
-psql_schema = public
-psql_table_name = users
-psql_key_column = user_id
-psql_columns = dob
-hbase_table_name = stuff
-hbase_column_descriptors = users:dob
-hbase_row_prefix = user_id:
-####################
-
-Bootstrapping:
-To bootstrap the public.users table from postgresql to hbase, 
-
-  ./hbrep.py hbrep.ini bootstrap public.users
-  
-you can specify multiple tables as arguments.
- 
- 
-Play:
-This mode uses pgq from the skytools package to create and manage event queues on postgresql.
-You need to have pgq installed on the database you are replicating.
-
-With a pgq.ini file like this:
-####################
-[pgqadm]
-job_name = sourcedb_ticker
-db = dbname=source_database user=dbuser
-# how often to run maintenance [minutes]
-maint_delay_min = 1
-# how often to check for activity [secs]
-loop_delay = 0.2
-logfile = %(job_name)s.log
-pidfile = %(job_name)s.pid
-use_skylog = 0
-####################
-
-You install pgq on the database by, 
-
-  pgqadm.py pgq.ini install
-
-Next you install hbrep.
-
-  hbrep.py hbrep.ini install public.users
-  
-This creates a queue using pgq, which in this case will be called hbase_replic_queue. It also registers the hbrep consumer (called HBaseReplic) with that queue. Then finally it creates triggers on each table specified to add an event for each insert, update or delete.
-
-Start the pgq event ticker,
-
-  pgqadm.py pgq.ini ticker
-
-Finally, run the hbreplic consumer
-  ./hbrep.py hbrep.ini play public.users
-  
-Now any inserts, updates or deletes on the postgresql users table will be processed and sent to the 
-hbase table.
-
-
-uninstall:
-You can remove the triggers from a table by
-  ./hbrep.py hbrep.ini uninstall public.users
-  
-  
-
--- a/src/examples/uploaders/hbrep/init.py
+++ b/src/examples/uploaders/hbrep/init.py
--- a/src/examples/uploaders/hbrep/bootstrap.py
+++ b/src/examples/uploaders/hbrep/bootstrap.py
@ -1,190 +0,0 @@
-import sys, os
-
-import pgq, pgq.producer
-import skytools
-
-from HBaseConnection import *
-import tablemapping
-
-class HBaseBootstrap(skytools.DBScript):
-  """Bootstrapping script for loading columns from a table in postgresql to hbase."""
-  
-  def __init__(self, service_name, args):
-    # This will process any options eg -k -v -d
-    skytools.DBScript.__init__(self, service_name, args)
-    
-    config_file = self.args[0]
-    if len(self.args) < 2:
-      print "need table names"
-      sys.exit(1)
-    else:
-      self.table_names = self.args[1:]
-    
-    #just to check this option exists
-    self.cf.get("postgresql_db")
-    
-    self.max_batch_size = int(self.cf.get("max_batch_size", "10000"))
-    self.hbase_hostname = self.cf.get("hbase_hostname", "localhost")
-    self.hbase_port = int(self.cf.get("hbase_port", "9090"))
-    self.table_mappings = tablemapping.load_table_mappings(config_file, self.table_names)
-  
-  def startup(self):
-    # make sure the script loops only once.
-    self.set_single_loop(1)
-    self.log.info("Starting " + self.job_name)
-    
-  def work(self):
-    for t in self.table_names:
-      self.bootstrap_table(t)
-      
-  def bootstrap_table(self, table_name):
-    try:
-      self.log.info("Bootstrapping table %s" % table_name)
-      hbase = HBaseConnection(self.hbase_hostname, self.hbase_port)
-      try:
-        table_mapping = self.table_mappings[table_name]
-      
-        self.log.debug("Connecting to HBase")
-        hbase.connect()
-        
-        # Fetch postgresql cursor
-        self.log.debug("Getting postgresql cursor")
-        db = self.get_database("postgresql_db")
-        curs = db.cursor()
-        
-        hbase.validate_table_name(table_mapping.hbase_table_name)
-        hbase.validate_column_descriptors(table_mapping.hbase_table_name, table_mapping.hbase_column_descriptors)
-        
-        try:
-          dump_file = self.cf.get("bootstrap_tmpfile")
-        except:
-          dump_file = None
-        
-        if dump_file != None:
-          row_source = CopiedRows(self.log, curs, dump_file)
-        else:
-          row_source = SelectedRows(self.log, curs)
-        
-        table_name = table_mapping.psql_schema+"."+table_mapping.psql_table_name
-        # we are careful to make sure that the first column will be the key.
-        column_list = [table_mapping.psql_key_column] + table_mapping.psql_columns
-        
-        # Load the rows either via a select or via a table copy to file. 
-        # Either way, it does not load it all into memory. 
-        # copy is faster, but may incorrectly handle data with tabs in it.
-        row_source.load_rows(table_name, column_list)
-        
-        # max number of rows to fetch at once
-        batch_size = self.max_batch_size
-        total_rows = 0L
-          
-        self.log.debug("Starting puts to hbase")
-        rows = row_source.get_rows(batch_size)
-        while rows != []:
-          batches = []
-          for row in rows:
-            batches.append(self.createRowBatch(table_mapping, row))
-          
-          hbase.client.mutateRows(table_mapping.hbase_table_name, batches)
-          total_rows = total_rows + len(batches)
-          self.log.debug("total rows put = %d" % (total_rows))
-          # get next batch of rows
-          rows = row_source.get_rows(batch_size)
-          
-        self.log.info("total rows put = %d" % (total_rows))
-        self.log.info("Bootstrapping table %s complete" % table_name)
-        
-        
-      except Exception, e:
-        #self.log.info(e)
-        sys.exit(e)
-      
-    finally:
-      hbase.disconnect()
-  
-  def createRowBatch(self, table_mapping, row):
-    batch = BatchMutation()
-    batch.row = table_mapping.hbase_row_prefix + str(row[0])
-    batch.mutations = []
-    for column, value in zip(table_mapping.hbase_column_descriptors, row[1:]):
-      if value != 'NULL' and  value != None:
-        m = Mutation()
-        m.column = column
-        m.value = str(value)
-        batch.mutations.append(m)
-    return batch
-  
-  
-## Helper classes to fetch rows from a select, or from a table dumped by copy
-  
-class RowSource:
-  """ Base class for fetching rows from somewhere. """
-  
-  def __init__(self, log):
-    self.log = log
-    
-  def make_column_str(self, column_list):
-    i = 0
-    while i < len(column_list):
-      column_list[i] = '"%s"' % column_list[i]
-      i += 1
-    return ",".join(column_list)
-  
-   
-class CopiedRows(RowSource):
-  """ 
-  Class for fetching rows from a postgresql database,
-  rows are dumped to a copied to a file first
-  """
-  def __init__(self, log, curs, dump_file):
-    RowSource.__init__(self, log)
-    self.dump_file = dump_file
-    # Set DBAPI-2.0 cursor
-    self.curs = curs
-    
-  def load_rows(self, table_name, column_list):
-    columns = self.make_column_str(column_list)
-    self.log.debug("starting dump to file:%s. table:%s. columns:%s" % (self.dump_file, table_name, columns))
-    dump_out = open(self.dump_file, 'w')
-    self.curs.copy_to(dump_out, table_name + "(%s)" % columns, '\t', 'NULL')
-    dump_out.close()
-    self.log.debug("table %s dump complete" % table_name)
-    
-    self.dump_in = open(self.dump_file, 'r')
-    
-  def get_rows(self, no_of_rows):
-    rows = []
-    if not self.dump_in.closed:
-      for line in self.dump_in:
-        rows.append(line.split())      
-        if len(rows) >= no_of_rows:
-          break
-      if rows == []:
-        self.dump_in.close()
-    return rows
-
-
-class SelectedRows(RowSource):
-  """ 
-  Class for fetching rows from a postgresql database,
-  rows are fetched via a select on the entire table.
-  """
-  def __init__(self, log, curs):
-    RowSource.__init__(self, log)
-    # Set DBAPI-2.0 cursor
-    self.curs = curs
-    
-  def load_rows(self, table_name, column_list):
-    columns = self.make_column_str(column_list)
-    q = "SELECT %s FROM %s" % (columns,table_name)
-    self.log.debug("Executing query %s" % q)
-    self.curs.execute(q)
-    self.log.debug("query finished")
-    
-  def get_rows(self, no_of_rows):
-    return self.curs.fetchmany(no_of_rows)
-    
-
-if __name__ == '__main__':
-  bootstrap = HBaseBootstrap("HBaseReplic",sys.argv[1:])
-  bootstrap.start()
--- a/src/examples/uploaders/hbrep/hbrep.ini
+++ b/src/examples/uploaders/hbrep/hbrep.ini
@ -1,22 +0,0 @@
-[HBaseReplic]
-job_name = hbase_replic_job
-logfile = %(job_name)s.log
-pidfile = %(job_name)s.pid
-postgresql_db = dbname=source_database user=dbuser
-pgq_queue_name = hbase_replic_queue
-hbase_hostname = localhost
-hbase_port = 9090
-# If omitted, default is 10000
-max_batch_size = 10000
-# file to use when copying a table, if omitted a select columns will be done instead.
-bootstrap_tmpfile = tabledump.dat
-
-# For each table mapping, there must be the same number psql_columns as hbase_column_descriptors
-[public.users]
-psql_schema = public
-psql_table_name = users
-psql_key_column = user_id
-psql_columns = dob
-hbase_table_name = stuff
-hbase_column_descriptors = users:dob
-hbase_row_prefix = user_id:
--- a/src/examples/uploaders/hbrep/hbrep.py
+++ b/src/examples/uploaders/hbrep/hbrep.py
@ -1,126 +0,0 @@
-#!/usr/bin/env python
-import sys, os
-
-import pgq, pgq.producer
-import skytools, skytools._pyquoting
-
-from bootstrap import HBaseBootstrap
-from HBaseConsumer import HBaseConsumer
-
-command_usage = """
-%prog [options] inifile command [tablenames]
-
-commands:
-  play          Run event consumer to update specified tables with hbase.
-  bootstrap     Bootstrap specified tables args into hbase.
-  install       Setup the pgq queue, and install trigger on each table.
-  uninstall     Remove the triggers from each specified table.
-"""
-
-class HBaseReplic(skytools.DBScript):
-  def __init__(self, service_name, args):
-    try:
-      self.run_script = 0
-      
-      # This will process any options eg -k -v -d
-      skytools.DBScript.__init__(self, service_name, args)
-      
-      self.config_file = self.args[0]
-      
-      if len(self.args) < 2:
-        self.print_usage()
-        print "need command"
-        sys.exit(0)
-      cmd = self.args[1]
-        
-      if not cmd in ["play","bootstrap","install", "uninstall"]:
-        self.print_usage()
-        print "unknown command"
-        sys.exit(0)
-        
-      if len(self.args) < 3:
-        self.print_usage()
-        print "need table names"
-        sys.exit(0)
-      else:
-        self.table_names = self.args[2:]
-      
-      if cmd == "play":
-        self.run_script = HBaseConsumer(service_name, [self.config_file] + self.table_names)
-      elif cmd == "bootstrap":
-        self.run_script = HBaseBootstrap(service_name, [self.config_file] + self.table_names)
-      elif cmd == "install":
-        self.work = self.do_install
-      elif cmd == "uninstall":
-        self.work = self.do_uninstall
-        
-    except Exception, e:
-      sys.exit(e)
-  
-  def print_usage(self):
-    print "Usage: " + command_usage
-    
-  def init_optparse(self, parser=None):
-    p = skytools.DBScript.init_optparse(self, parser)
-    p.set_usage(command_usage.strip())
-    return p
-
-  def start(self):
-    if self.run_script:
-      self.run_script.start()
-    else:
-      skytools.DBScript.start(self)
-      
-  def startup(self):
-    # make sure the script loops only once.
-    self.set_single_loop(1)
-    
-  def do_install(self):
-    try:
-      queue_name = self.cf.get("pgq_queue_name")
-      consumer = self.job_name
-      
-      self.log.info('Creating queue: %s' % queue_name)
-      self.exec_sql("select pgq.create_queue(%s)", [queue_name])
-  
-      self.log.info('Registering consumer %s on queue %s' % (consumer, queue_name))
-      self.exec_sql("select pgq.register_consumer(%s, %s)", [queue_name, consumer])
-  
-      for table_name in self.table_names:
-        self.log.info('Creating trigger hbase_replic on table %s' % (table_name))
-        q = """
-        CREATE TRIGGER hbase_replic
-          AFTER INSERT OR UPDATE OR DELETE
-          ON %s
-          FOR EACH ROW
-          EXECUTE PROCEDURE pgq.logutriga('%s')"""
-        self.exec_sql(q % (table_name, queue_name), [])
-    except Exception, e:
-      sys.exit(e)
-      
-  def do_uninstall(self):
-    try:
-      queue_name = self.cf.get("pgq_queue_name")
-      consumer = "HBaseReplic"
-      
-      #self.log.info('Unregistering consumer %s on queue %s' % (consumer, queue_name))
-      #self.exec_sql("select pgq.unregister_consumer(%s, %s)", [queue_name, consumer])
-  
-      for table_name in self.table_names:
-        self.log.info('Dropping trigger hbase_replic on table %s' % (table_name))
-        q = "DROP TRIGGER hbase_replic ON %s" % table_name
-        self.exec_sql(q, [])
-        
-    except Exception, e:
-      sys.exit(e)
-    
-  def exec_sql(self, q, args):
-    self.log.debug(q)
-    db = self.get_database('postgresql_db')
-    curs = db.cursor()
-    curs.execute(q, args)
-    db.commit()
-    
-if __name__ == '__main__':
-  script = HBaseReplic("HBaseReplic",sys.argv[1:])
-  script.start()
--- a/src/examples/uploaders/hbrep/pgq.ini
+++ b/src/examples/uploaders/hbrep/pgq.ini
@ -1,10 +0,0 @@
-[pgqadm]
-job_name = sourcedb_ticker
-db = dbname=source_database user=dbuser
-# how often to run maintenance [minutes]
-maint_delay_min = 1
-# how often to check for activity [secs]
-loop_delay = 0.2
-logfile = %(job_name)s.log
-pidfile = %(job_name)s.pid
-use_skylog = 0
--- a/src/examples/uploaders/hbrep/tablemapping.py
+++ b/src/examples/uploaders/hbrep/tablemapping.py
@ -1,33 +0,0 @@
-import sys, os
-from skytools.config import *
-
-PSQL_SCHEMA = "psql_schema"
-PSQL_TABLENAME = "psql_table_name"
-PSQL_KEYCOL = "psql_key_column"
-PSQL_COLUMNS = "psql_columns"
-HBASE_TABLENAME = "hbase_table_name"
-HBASE_COLUMNDESCS = "hbase_column_descriptors"
-HBASE_ROWPREFIX = "hbase_row_prefix"
-
-def load_table_mappings(config_file, table_names):
-  table_mappings = {}
-  for table_name in table_names:
-    conf = Config(table_name, config_file)
-    table_mappings[table_name] = PSqlHBaseTableMapping(conf)
-  return table_mappings
-  
-class PSqlHBaseTableMapping:
-  # conf can be anything with a get function eg, a dictionary
-  def __init__(self, conf):
-    self.psql_schema = conf.get(PSQL_SCHEMA)
-    self.psql_table_name = conf.get(PSQL_TABLENAME)
-    self.psql_key_column = conf.get(PSQL_KEYCOL)
-    self.psql_columns = conf.get(PSQL_COLUMNS).split()
-    self.hbase_table_name = conf.get(HBASE_TABLENAME)
-    self.hbase_column_descriptors = conf.get(HBASE_COLUMNDESCS).split()
-    self.hbase_row_prefix = conf.get(HBASE_ROWPREFIX)
-    
-    if len(self.psql_columns) != len(self.hbase_column_descriptors):
-      raise Exception("psql_columns and hbase_column_descriptors must have same length")
-    
-