RubyGems - bigrecord-driver - Versions diffs - 0.0.6 → 0.0.7 - Mend

bigrecord-driver 0.0.6 → 0.0.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16)

data/VERSION +1 -1
data/bin/bigrecord-driver +41 -40
data/bin/hbase-driver +12 -12
data/lib/big_record_driver.rb +13 -6
data/lib/big_record_driver/client.rb +32 -29
data/lib/big_record_driver/column_descriptor.rb +13 -16
data/lib/big_record_driver/exceptions.rb +12 -10
data/lib/big_record_driver/hbase_driver/server.rb +351 -320
data/lib/big_record_driver/server.rb +123 -0
data/lib/big_record_driver/version.rb +4 -2
data/test/abstract_test_client.rb +5 -6
data/test/test_client_hbase.rb +13 -17
metadata +3 -5
data/lib/big_record_driver/bigrecord_server.rb +0 -119
data/lib/big_record_driver/driver_manager.rb +0 -34
data/test/test_driver_manager.rb +0 -46

data/VERSION CHANGED Viewed

	@@ -1 +1 @@
1	- 0.0.6
1	+ 0.0.7

data/bin/bigrecord-driver CHANGED Viewed

@@ -62,7 +62,7 @@ unset RUBYLIB
 if [ "$DRIVERNAME" == "" ]; then
   echo "Driver type was not specified"
   exit 1
-elif [ "$DRIVERNAME" != "hbase" -a "$DRIVERNAME" != "cassandra" ]; then
+elif [ "$DRIVERNAME" != "hbase" ]; then
   echo "Driver type \"$DRIVERNAME\" is invalid"
   exit 1
 fi
@@ -126,30 +126,30 @@ start() {
     refresh_pids
     if [ -f "$PIDS_DIR/$PORT.pid" -a "$PID" != "" ] ; then
-        echo -e "\nAlready running (pid="$PID")."
-        exit 1
+      echo -e "\nAlready running (pid="$PID")."
+      exit 1
     else
 	    rm -f $LOGS_DIR/$PORT.log
 	    nohup jruby $DRIVER $PORT >> $LOGS_DIR/$PORT.log 2>&1 < /dev/null &
 	    PID=$!
 	    if [ "$PID" != "" ] ; then
-	        # monitor the log file for the message saying that the server is started
-	        for ((i=0; i<$STARTUP_TIMEOUT; i+=1)); do
-	          sleep 1
-	          echo -n "."
-	          if [ "$(cat $LOGS_DIR/$PORT.log | grep 'Started drb server')" != "" ] ; then
-	            break
-	          fi
-	        done
-	        if [ "$i" == $STARTUP_TIMEOUT ] ; then
-	          echo -e "\nStartup timeout: couldn't start the DRb server."
-	        else
-	          echo $PID > $PIDS_DIR/$PORT.pid
-	        fi
-	        echo ""
+        # monitor the log file for the message saying that the server is started
+        for ((i=0; i<$STARTUP_TIMEOUT; i+=1)); do
+          sleep 1
+          echo -n "."
+          if [ "$(cat $LOGS_DIR/$PORT.log | grep 'Started drb server')" != "" ] ; then
+            break
+          fi
+        done
+        if [ "$i" == $STARTUP_TIMEOUT ] ; then
+          echo -e "\nStartup timeout: couldn't start the DRb server."
+        else
+          echo $PID > $PIDS_DIR/$PORT.pid
+        fi
+        echo ""
 	    else
-            echo -e "\nAn error occured while starting the DRb server."
+        echo -e "\nAn error occured while starting the DRb server."
 	    fi
     fi
 }
@@ -161,8 +161,8 @@ stop() {
 	if [ -f "$PIDS_DIR/$PORT.pid" -a "$PID" != "" ] ; then
 		echo "Stopping driver (pid = $PID)." >> $LOGS_DIR/$PORT.log
-	    kill $PID
-	    rm $PIDS_DIR/$PORT.pid
+    kill $PID
+    rm $PIDS_DIR/$PORT.pid
 	else
 		echo "No $DRIVERNAME driver to kill."
 	fi
@@ -183,24 +183,25 @@ start_debug() {
 }
 case "$ACTION" in
-    start)
-   		start
-        ;;
-    stop)
-   		stop
-        ;;
-    restart)
-   		stop
-   		start
-        ;;
-    status)
-        status
-        ;;
-    start_debug)
-    	start_debug
-    	;;
-    *)
-        print_usage
-        exit 1
+  start)
+	  start
+    ;;
+  stop)
+	  stop
+    ;;
+  restart)
+	  stop
+	  start
+    ;;
+  status)
+    status
+    ;;
+  start_debug)
+	  start_debug
+	  ;;
+  *)
+    print_usage
+    exit 1
 esac
 exit 0

data/bin/hbase-driver CHANGED Viewed

@@ -11,22 +11,22 @@ if ARGV.include?("-l")
   # Make sure that the folder exists
   if File.exists?(hbase_path)
-	# We're only going to include the jar files we need.
-	required_jars = Dir[hbase_path+"/*.jar",
-						hbase_path+"/lib/commons-logging*.jar",
-						hbase_path+"/lib/zookeeper*.jar",
-						hbase_path+"/lib/log4j*.jar",
-						hbase_path+"/lib/hadoop*.jar"]
-	classpath = required_jars.join(":")
+	  # We're only going to include the jar files we need.
+	  required_jars = Dir[hbase_path+"/*.jar",
+						  hbase_path+"/lib/commons-logging*.jar",
+						  hbase_path+"/lib/zookeeper*.jar",
+						  hbase_path+"/lib/log4j*.jar",
+						  hbase_path+"/lib/hadoop*.jar"]
+	  classpath = required_jars.join(":")
-	args.delete_at(switch_index)
-	args.delete_at(switch_index)
-	args = args + ["-c", '"'+classpath+'"']
+	  args.delete_at(switch_index)
+	  args.delete_at(switch_index)
+	  args = args + ["-c", '"'+classpath+'"']
   # Otherwise we'll warn the user and quit
   else
-	puts "Folder #{hbase_path} does not exist"
-	exit
+	  puts "Folder #{hbase_path} does not exist"
+	  exit
   end
 end

data/lib/big_record_driver.rb CHANGED Viewed

@@ -1,7 +1,14 @@
-LIB_ROOT = File.dirname(__FILE__)
+module BigRecord
+  module Driver
+  end
+end
-require LIB_ROOT + '/big_record_driver/client'
-require LIB_ROOT + '/big_record_driver/exceptions'
-require LIB_ROOT + '/big_record_driver/column_descriptor'
-require LIB_ROOT + '/big_record_driver/driver_manager'
-require LIB_ROOT + '/big_record_driver/version'
+BRD_ROOT = File.dirname(__FILE__)
+require BRD_ROOT + '/big_record_driver/client'
+require BRD_ROOT + '/big_record_driver/exceptions'
+require BRD_ROOT + '/big_record_driver/column_descriptor'
+require BRD_ROOT + '/big_record_driver/version'
+# Aliasing the old namespace
+BigRecordDriver = BigRecord::Driver

data/lib/big_record_driver/client.rb CHANGED Viewed

@@ -1,36 +1,39 @@
-require 'rubygems'
-require 'activesupport'
+require 'active_support'
 require 'set'
 require 'drb'
-module BigRecordDriver
-  class Client
-    def initialize(config={}) # :nodoc:
-      config = config.symbolize_keys
-      config[:drb_host]     ||= '127.0.0.1'
-      config[:drb_port]     ||= 40000
-      @config = config
-      DRb.start_service('druby://127.0.0.1:0')
-      begin
-        @server = DRbObject.new(nil, "druby://#{@config[:drb_host]}:#{@config[:drb_port]}")
-      rescue DRb::DRbConnError
-        raise ConnectionError, "Failed to connect to the DRb server (jruby) " +
-                                      "at #{@config[:drb_host]}:#{@config[:drb_port]}."
+module BigRecord
+  module Driver
+    class Client
+      attr_accessor :config, :server
+      def initialize(config={}) # :nodoc:
+        config = config.symbolize_keys
+        config[:drb_host] ||= '127.0.0.1'
+        config[:drb_port] ||= 40000
+        @config = config
+        DRb.start_service nil
+        begin
+          @server = DRbObject.new(nil, "druby://#{@config[:drb_host]}:#{@config[:drb_port]}")
+        rescue DRb::DRbConnError
+          raise ConnectionError, "Failed to connect to the DRb server (jruby) " +
+                                        "at #{@config[:drb_host]}:#{@config[:drb_port]}."
+        end
+        @server.configure(@config)
+      end
+      # Delegate the methods to the server
+      def method_missing(method, *args)
+        @server.send(method, *args)
+      end
+      def respond_to?(method)
+        super
       end
-      @server.configure(@config)
-    end
-    # Delegate the methods to the server
-    def method_missing(method, *args)
-      @server.send(method, *args)
-    end
-    def respond_to?(method)
-      super
     end
   end
 end

data/lib/big_record_driver/column_descriptor.rb CHANGED Viewed

@@ -1,23 +1,20 @@
-module BigRecordDriver
+module BigRecord
+  module Driver
-  class ColumnDescriptor
+    class ColumnDescriptor
+      attr_accessor :name, :versions, :in_memory, :bloom_filter, :compression
-    attr_accessor :name
-    attr_accessor :versions
-    attr_accessor :in_memory
-    attr_accessor :bloom_filter
-    attr_accessor :compression
+      def initialize(name, options={})
+        raise ArgumentError, "name is mandatory" unless name
-    def initialize(name, options={})
-      raise ArgumentError, "name is mandatory" unless name
-      @name = name.to_s
-      @versions         = options[:versions]
-      @in_memory        = options[:in_memory]
-      @bloom_filter     = options[:bloom_filter]
-      @compression      = options[:compression]
+        @name = name.to_s
+        @versions     = options[:versions]
+        @in_memory    = options[:in_memory]
+        @bloom_filter = options[:bloom_filter]
+        @compression  = options[:compression]
+      end
     end
   end
 end

data/lib/big_record_driver/exceptions.rb CHANGED Viewed

@@ -1,12 +1,14 @@
-module BigRecordDriver
-  class BigDBError < StandardError
-  end
-  class TableNotFound < BigDBError
-  end
-  class TableAlreadyExists < BigDBError
-  end
-  class JavaError < BigDBError
-  end
-  class ConnectionError < BigDBError
+module BigRecord
+  module Driver
+    class DriverError < StandardError
+    end
+    class TableNotFound < DriverError
+    end
+    class TableAlreadyExists < DriverError
+    end
+    class JavaError < DriverError
+    end
+    class ConnectionError < DriverError
+    end
   end
 end

data/lib/big_record_driver/hbase_driver/server.rb CHANGED Viewed

@@ -1,396 +1,427 @@
 require File.dirname(__FILE__) + '/../column_descriptor'
 require File.dirname(__FILE__) + '/../exceptions'
-require File.dirname(__FILE__) + '/../bigrecord_server'
+require File.dirname(__FILE__) + '/../server'
-module BigRecordDriver
+module BigRecord
+  module Driver
-class HbaseServer < BigRecordServer
-  include_class "java.util.TreeMap"
+    class HbaseServer < Server
+      java_import "java.util.TreeMap"
+      include_package "org.apache.hadoop.hbase.client"
+      java_import "org.apache.hadoop.hbase.KeyValue"
+      java_import "org.apache.hadoop.hbase.io.hfile.Compression"
+      java_import "org.apache.hadoop.hbase.HBaseConfiguration"
+      java_import "org.apache.hadoop.hbase.HTableDescriptor"
+      java_import "org.apache.hadoop.hbase.HColumnDescriptor"
-  include_class "org.apache.hadoop.hbase.client.HTable"
-  include_class "org.apache.hadoop.hbase.client.HBaseAdmin"
-  include_class "org.apache.hadoop.hbase.io.BatchUpdate"
-  include_class "org.apache.hadoop.hbase.io.hfile.Compression"
-  include_class "org.apache.hadoop.hbase.HBaseConfiguration"
-  include_class "org.apache.hadoop.hbase.HConstants"
-  include_class "org.apache.hadoop.hbase.HStoreKey"
-  include_class "org.apache.hadoop.hbase.HTableDescriptor"
-  include_class "org.apache.hadoop.hbase.HColumnDescriptor"
+      # Establish the connection with HBase with the given configuration parameters.
+      def configure(config = {})
+        config[:zookeeper_quorum]       ||= 'localhost'
+        config[:zookeeper_client_port]  ||= '2181'
-  include_class "org.apache.hadoop.io.Writable"
+        @config = config
-  # Establish the connection with HBase with the given configuration parameters.
-  def configure(config = {})
-    config[:zookeeper_quorum]        ||= 'localhost'
-    config[:zookeeper_client_port]  ||= '2181'
+        init_connection
+      end
-    @config = config
+      # Atomic row insertion/update. Example:
+      #   update('entities', 'b9cef848-a4e0-11dc-a7ba-0018f3137ea8', {'attribute:name' => "--- Oahu\n",
+      #                                                               'attribute:travel_rank' => "--- 0.90124565\n"})
+      #   => 'b9cef848-a4e0-11dc-a7ba-0018f3137ea8'
+      def update(table_name, row, values, timestamp=nil)
+        safe_exec do
+          return nil unless row
-    init_connection
-  end
+          table = connect_table(table_name)
+          row_lock = table.lockRow(row.to_bytes)
-  # Atomic row insertion/update. Example:
-  #   update('entities', 'b9cef848-a4e0-11dc-a7ba-0018f3137ea8', {'attribute:name' => "--- Oahu\n",
-  #                                                               'attribute:travel_rank' => "--- 0.90124565\n"})
-  #   => 'b9cef848-a4e0-11dc-a7ba-0018f3137ea8'
-  def update(table_name, row, values, timestamp=nil)
-    safe_exec do
-      return nil unless row
-      table = connect_table(table_name)
+          put = generate_put(row, values, timestamp, row_lock)
+          table.put(put)
-      batch = timestamp ? BatchUpdate.new(row, timestamp) : BatchUpdate.new(row)
+          table.unlockRow(row_lock)
-      values.each do |column, value|
-        batch.put(column, value.to_bytes)
+          row
+        end
       end
-      table.commit(batch)
-      row
-    end
-  end
+      # Returns a column of a row. Example:
+      #   get('entities', 'b9cef848-a4e0-11dc-a7ba-0018f3137ea8', 'attribute:travel_rank')
+      #   => "--- 0.90124565\n"
+      #
+      # valid options:
+      #   :timestamp  => integer corresponding to the time when the record was saved in hbase
+      #   :versions   => number of versions to retrieve, starting at the specified timestamp (or the latest)
+      def get(table_name, row, column, options={})
+        safe_exec do
+          return nil unless row
+          table = connect_table(table_name)
+          # Grab the version number if the client's using the old API,
+          # or retrieve only the latest version by default
+          options[:versions] ||= options[:num_versions]
+          options[:versions] ||= 1
+          # validate the arguments
+          raise ArgumentError, "versions must be >= 1" unless options[:versions] >= 1
+          get = generate_get(row, column, options)
+          result = table.get(get)
+          if (result.nil? || result.isEmpty)
+            return (options[:versions] == 1 ? nil : [])
+          else
+            output = result.list.collect do |keyvalue|
+              to_ruby_string(keyvalue.getValue)
+            end
-  # Returns a column of a row. Example:
-  #   get('entities', 'b9cef848-a4e0-11dc-a7ba-0018f3137ea8', 'attribute:travel_rank')
-  #   => "--- 0.90124565\n"
-  #
-  # valid options:
-  #   :timestamp      => integer corresponding to the time when the record was saved in hbase
-  #   :versions   => number of versions to retreive, starting at the specified timestamp (or the latest)
-  def get(table_name, row, column, options={})
-    safe_exec do
-      return nil unless row
-      table = connect_table(table_name)
-      # Retreive only the last version by default
-      options[:versions] ||= options[:num_versions]
-      options[:versions] ||= 1
-      # validate the arguments
-      raise ArgumentError, "versions must be >= 1" unless options[:versions] >= 1
-      # get the raw data from hbase
-      unless options[:timestamp]
-        if options[:versions] == 1
-          raw_data = table.get(row, column)
-        else
-          raw_data = table.get(row,
-                                column,
-                                options[:versions])
+            return (options[:versions] == 1 ? output[0] : output)
+          end
         end
-      else
-        raw_data = table.get(row,
-                              column,
-                              options[:timestamp],
-                              options[:versions])
       end
-      # Return either a single value or an array, depending on the number of version that have been requested
-      if options[:versions] == 1
-        return nil unless raw_data
-        raw_data = raw_data[0] if options[:timestamp]
-        to_ruby_string(raw_data)
-      else
-        return [] unless raw_data
-        raw_data.collect do |raw_data_version|
-          to_ruby_string(raw_data_version)
+      # Returns the last version of the given columns of the given row. The columns works with
+      # regular expressions (e.g. 'attribute:' matches all attributes columns). Example:
+      #   get_columns('entities', 'b9cef848-a4e0-11dc-a7ba-0018f3137ea8', ['attribute:'])
+      #   => {"attribute:name" => "--- Oahu\n", "attribute:travel_rank" => "--- 0.90124565\n", etc...}
+      def get_columns(table_name, row, columns, options={})
+        safe_exec do
+          return nil unless row
+          table_name = table_name.to_s
+          table = connect_table(table_name)
+          get = generate_get(row, columns, options)
+          result = table.get(get)
+          begin
+            parse_result(result)
+          rescue
+            nil
+          end
         end
       end
-    end
-  end
-  # Returns the last version of the given columns of the given row. The columns works with
-  # regular expressions (e.g. 'attribute:' matches all attributes columns). Example:
-  #   get_columns('entities', 'b9cef848-a4e0-11dc-a7ba-0018f3137ea8', ['attribute:'])
-  #   => {"attribute:name" => "--- Oahu\n", "attribute:travel_rank" => "--- 0.90124565\n", etc...}
-  def get_columns(table_name, row, columns, options={})
-    safe_exec do
-      return nil unless row
-      table_name = table_name.to_s
-      table = connect_table(table_name)
-      java_cols = Java::String[columns.size].new
-      columns.each_with_index do |col, i|
-        java_cols[i] = Java::String.new(col)
-      end
+      # Get consecutive rows. Example to get 100 records starting with the one specified and get all the
+      # columns in the column family 'attribute:' :
+      #   get_consecutive_rows('entities', 'b9cef848-a4e0-11dc-a7ba-0018f3137ea8', 100, ['attribute:'])
+      def get_consecutive_rows(table_name, start_row, limit, columns, stop_row = nil)
+        safe_exec do
+          table_name = table_name.to_s
+          table = connect_table(table_name)
-      result =
-      if options[:timestamp]
-        table.getRow(row, java_cols, options[:timestamp])
-      else
-        table.getRow(row, java_cols)
-      end
+          scan = Scan.new
+          scan.setStartRow(start_row.to_bytes) if start_row
+          scan.setStopRow(stop_row.to_bytes) if stop_row
+          columns.each do |column|
+            (column[-1,1] == ":") ?
+              scan.addFamily(column.gsub(":", "").to_bytes) :
+              scan.addColumn(column.to_bytes)
+          end
+          scanner = table.getScanner(scan)
-      unless !result or result.isEmpty
-        values = {}
-        result.entrySet.each do |entry|
-          column_name = Java::String.new(entry.getKey).to_s
-          values[column_name] = to_ruby_string(entry.getValue)
+          if limit
+            results = scanner.next(limit)
+          else
+            results = []
+            while (row_result = scanner.next) != nil
+              results << row_result
+            end
+          end
+          output = []
+          results.each do |result|
+            output << parse_result(result)
+          end
+          scanner.close
+          return output
         end
-        values["id"] = row
-        values
-      else
-        nil
       end
-    end
-  end
-  # Get consecutive rows. Example to get 100 records starting with the one specified and get all the
-  # columns in the column family 'attribute:' :
-  #   get_consecutive_rows('entities', 'b9cef848-a4e0-11dc-a7ba-0018f3137ea8', 100, ['attribute:'])
-  def get_consecutive_rows(table_name, start_row, limit, columns, stop_row = nil)
-    safe_exec do
-      table_name = table_name.to_s
-      table = connect_table(table_name)
-      java_cols = Java::String[columns.size].new
-      columns.each_with_index do |col, i|
-        java_cols[i] = Java::String.new(col)
+      # Delete a whole row.
+      def delete(table_name, row, timestamp = nil)
+        safe_exec do
+          table = connect_table(table_name)
+          if timestamp
+            row_lock = table.lockRow(row.to_bytes)
+            table.delete(Delete.new(row.to_bytes, timestamp, row_lock))
+            table.unlockRow(row_lock)
+          else
+            table.delete(Delete.new(row.to_bytes))
+          end
+        end
       end
-      start_row ||= ""
-      start_row = start_row.to_s
+      # Create a table
+      def create_table(table_name, column_descriptors)
+        safe_exec do
+          table_name = table_name.to_s
+          unless table_exists?(table_name)
+            tdesc = HTableDescriptor.new(table_name)
-      # We cannot set stop_row like start_row because a
-      # default stop row would have to be the biggest value possible
-      if stop_row
-        scanner = table.getScanner(java_cols, start_row, stop_row, HConstants::LATEST_TIMESTAMP)
-      else
-        scanner = table.getScanner(java_cols, start_row)
-      end
+            column_descriptors.each do |cd|
+              cdesc = generate_column_descriptor(cd)
-      row_count = 0 if limit
-      result = []
-      while (row_result = scanner.next) != nil
-        if limit
-          break if row_count == limit
-          row_count += 1
-        end
-        values = {}
-        row_result.entrySet.each do |entry|
-          column_name = Java::String.new(entry.getKey).to_s
-          data = to_ruby_string(entry.getValue)
-          values[column_name] = data
+              tdesc.addFamily(cdesc)
+            end
+            @admin.createTable(tdesc)
+          else
+            raise TableAlreadyExists, table_name
+          end
         end
-        unless values.empty?
-          # TODO: is this really supposed to be hard coded?
-          values['id'] = Java::String.new(row_result.getRow).to_s
-          result << values
+      end
+      # Delete a table
+      def drop_table(table_name)
+        safe_exec do
+          table_name = table_name.to_s
+          if @admin.tableExists(table_name)
+            @admin.disableTable(table_name)
+            @admin.deleteTable(table_name)
+            # Remove the table connection from the cache
+            @tables.delete(table_name) if @tables.has_key?(table_name)
+          else
+            raise TableNotFound, table_name
+          end
         end
       end
-      scanner.close
-      result
-    end
-  end
-  # Delete a whole row.
-  def delete(table_name, row, timestamp = nil)
-    safe_exec do
-      table = connect_table(table_name)
-      timestamp ? table.deleteAll(row.to_bytes, timestamp) : table.deleteAll(row.to_bytes)
-    end
-  end
+      def add_column(table_name, column_descriptor)
+        safe_exec do
+          table_name = table_name.to_s
-  # Create a table
-  def create_table(table_name, column_descriptors)
-    safe_exec do
-      table_name = table_name.to_s
-      unless table_exists?(table_name)
-        tdesc = HTableDescriptor.new(table_name)
+          if @admin.tableExists(table_name)
+            @admin.disableTable(table_name)
-        column_descriptors.each do |cd|
-          cdesc = generate_column_descriptor(cd)
+            cdesc = generate_column_descriptor(column_descriptor)
+            @admin.addColumn(table_name, cdesc)
-          tdesc.addFamily(cdesc)
+            @admin.enableTable(table_name)
+          else
+            raise TableNotFound, table_name
+          end
         end
-        @admin.createTable(tdesc)
-      else
-        raise BigRecordDriver::TableAlreadyExists, table_name
       end
-    end
-  end
-  # Delete a table
-  def drop_table(table_name)
-    safe_exec do
-      table_name = table_name.to_s
+      def remove_column(table_name, column_name)
+        safe_exec do
+          table_name = table_name.to_s
+          column_name = column_name.to_s
+          if @admin.tableExists(table_name)
+            @admin.disableTable(table_name)
-      if @admin.tableExists(table_name)
-        @admin.disableTable(table_name)
-        @admin.deleteTable(table_name)
+            column_name << ":" unless column_name =~ /:$/
+            @admin.deleteColumn(table_name, column_name)
-        # Remove the table connection from the cache
-        @tables.delete(table_name) if @tables.has_key?(table_name)
-      else
-        raise BigRecordDriver::TableNotFound, table_name
+            @admin.enableTable(table_name)
+          else
+            raise TableNotFound, table_name
+          end
+        end
       end
-    end
-  end
-  def add_column(table_name, column_descriptor)
-    safe_exec do
-      table_name = table_name.to_s
+      def modify_column(table_name, column_descriptor)
+        safe_exec do
+          table_name = table_name.to_s
-      if @admin.tableExists(table_name)
-        @admin.disableTable(table_name)
+          if @admin.tableExists(table_name)
+            @admin.disableTable(table_name)
-        cdesc = generate_column_descriptor(column_descriptor)
-        @admin.addColumn(table_name, cdesc)
+            cdesc = generate_column_descriptor(column_descriptor)
+            @admin.modifyColumn(table_name, column_descriptor.name, cdesc)
-        @admin.enableTable(table_name)
-      else
-        raise BigRecordDriver::TableNotFound, table_name
+            @admin.enableTable(table_name)
+          else
+            raise TableNotFound, table_name
+          end
+        end
       end
-    end
-  end
-  def remove_column(table_name, column_name)
-    safe_exec do
-      table_name = table_name.to_s
-      column_name = column_name.to_s
+      def truncate_table(table_name)
+        safe_exec do
+          table_name = table_name.to_s
+          table = connect_table(table_name)
+          tableDescriptor = table.getTableDescriptor
+          drop_table(table_name)
+          @admin.createTable(tableDescriptor)
+        end
+      end
-      if @admin.tableExists(table_name)
-        @admin.disableTable(table_name)
+      def ping
+        safe_exec do
+          @admin.isMasterRunning
+        end
+      end
-        column_name << ":" unless column_name =~ /:$/
-        @admin.deleteColumn(table_name, column_name)
+      def table_exists?(table_name)
+        safe_exec do
+          @admin.tableExists(table_name.to_s)
+        end
+      end
-        @admin.enableTable(table_name)
-      else
-        raise BigRecordDriver::TableNotFound, table_name
+      def table_names
+        safe_exec do
+          @admin.listTables.collect{|td| Java::String.new(td.getName).to_s}
+        end
       end
-    end
-  end
-  def modify_column(table_name, column_descriptor)
-    safe_exec do
-      table_name = table_name.to_s
-      column_name = column_name.to_s
+    private
-      if @admin.tableExists(table_name)
-        @admin.disableTable(table_name)
+      def init_connection
+        safe_exec do
+          @conf = HBaseConfiguration.new
+          @conf.set('hbase.zookeeper.quorum', "#{@config[:zookeeper_quorum]}")
+          @conf.set('hbase.zookeeper.property.clientPort', "#{@config[:zookeeper_client_port]}")
+          @admin = HBaseAdmin.new(@conf)
+          @tables = {}
+        end
+      end
-        cdesc = generate_column_descriptor(column_descriptor)
-        @admin.modifyColumn(table_name, column_descriptor.name, cdesc)
+      # Create a connection to an HBase table and keep it in memory.
+      def connect_table(table_name)
+        safe_exec do
+          table_name = table_name.to_s
+          return @tables[table_name] if @tables.has_key?(table_name)
-        @admin.enableTable(table_name)
-      else
-        raise BigRecordDriver::TableNotFound, table_name
+          if table_exists?(table_name)
+            @tables[table_name] = HTable.new(@conf, table_name)
+          else
+            if table_name and !table_name.empty?
+              raise TableNotFound, table_name
+            else
+              raise ArgumentError, "Table name not specified"
+            end
+          end
+          @tables[table_name]
+        end
       end
-    end
-  end
-  def truncate_table(table_name)
-    safe_exec do
-      table_name = table_name.to_s
-      table = connect_table(table_name)
-      tableDescriptor = table.getTableDescriptor
-      drop_table(table_name)
-      @admin.createTable(tableDescriptor)
-    end
-  end
+      # Create a Get object given parameters.
+      #
+      # @param [String] row
+      # @param [Array, String] A single (or collection) of strings
+      #     fully qualified column name or column family (ends with ':').
+      # @param [Hash] options
+      #
+      # @return [Get] org.apache.hadoop.hbase.client.Get object
+      #     corresponding to the arguments passed.
+      def generate_get(row, columns, options = {})
+        columns = [columns].flatten
+        get = Get.new(row.to_bytes)
+        columns.each do |column|
+          # If the column name ends with ':' then it's a column family.
+          (column[-1,1] == ":") ?
+            get.addFamily(column.gsub(":", "").to_bytes) :
+            get.addColumn(column.to_bytes)
+        end
-  def ping
-    safe_exec do
-      @admin.isMasterRunning
-    end
-  end
+        get.setMaxVersions(options[:versions]) if options[:versions]
-  def table_exists?(table_name)
-    safe_exec do
-      @admin.tableExists(table_name.to_s)
-    end
-  end
+        # Need to add 1 to the timestamp due to the API silliness, i.e. min timestamp
+        # is inclusive while max timestamp is exclusive.
+        get.setTimeRange(java.lang.Long::MIN_VALUE, options[:timestamp]+1) if options[:timestamp]
-  def table_names
-    safe_exec do
-      @admin.listTables.collect{|td| Java::String.new(td.getName).to_s}
-    end
-  end
+        return get
+      end
-#  def const_missing(const)
-#    super
-#  rescue NameError => ex
-#    raise NameError, "uninitialized constant #{const}"
-#  end
-private
-  # Create a connection to a Hbase table and keep it in memory.
-  def connect_table(table_name)
-    safe_exec do
-      table_name = table_name.to_s
-      return @tables[table_name] if @tables.has_key?(table_name)
-      if table_exists?(table_name)
-        @tables[table_name] = HTable.new(@conf, table_name)
-      else
-        if table_name and !table_name.empty?
-          raise BigRecordDriver::TableNotFound, table_name
-        else
-          raise ArgumentError, "Table name not specified"
+      # Create a Put object given parameters.
+      #
+      # @param [String] row
+      # @param [Hash] Keys as the fully qualified column names and
+      #     their associated values.
+      # @param [Integer] timestamp
+      # @param [org.apache.hadoop.hbase.client.RowLock] row_lock
+      #
+      # @return [Put] org.apache.hadoop.hbase.client.Put object
+      #     corresponding to the arguments passed.
+      def generate_put(row, columns = {}, timestamp = nil, row_lock = nil)
+        put = row_lock ? Put.new(row.to_bytes, row_lock) : Put.new(row.to_bytes)
+        columns.each do |name, value|
+          family, qualifier = name.split(":")
+          timestamp ?
+            put.add(family.to_bytes, qualifier.to_bytes, timestamp, value.to_bytes) :
+            put.add(family.to_bytes, qualifier.to_bytes, value.to_bytes)
         end
+        return put
       end
-      @tables[table_name]
-    end
-  end
-  def init_connection
-    safe_exec do
-      @conf = HBaseConfiguration.new
-      @conf.set('hbase.zookeeper.quorum', "#{@config[:zookeeper_quorum]}")
-      @conf.set('hbase.zookeeper.property.clientPort', "#{@config[:zookeeper_client_port]}")
-      @admin = HBaseAdmin.new(@conf)
-      @tables = {}
-    end
-  end
+      # Parse a Result object into a Hash.
+      #
+      # @param [Result] result
+      #
+      # @return [Hash] Fully qualified column names as keys
+      #     and their corresponding values.
+      def parse_result(result)
+        output = {}
+        result.list.each do |keyvalue|
+          output[to_ruby_string(keyvalue.getColumn)] = to_ruby_string(keyvalue.getValue)
+        end
-  def generate_column_descriptor(column_descriptor)
-    raise ArgumentError, "a column descriptor is missing a name" unless column_descriptor.name
-    raise "bloom_filter option not supported yet" if column_descriptor.bloom_filter
+        output["id"] = to_ruby_string(result.getRow)
-    if column_descriptor.compression
-      compression =
-        case column_descriptor.compression.to_s
-          when 'none';   Compression::Algorithm::NONE.getName()
-          when 'gz';     Compression::Algorithm::GZ.getName()
-          when 'lzo';    Compression::Algorithm::LZO.getName()
-          else
-            raise ArgumentError, "Invalid compression type: #{column_descriptor.compression} for the column_family #{column_descriptor.name}"
+        return output
+      end
+      def generate_column_descriptor(column_descriptor)
+        raise ArgumentError, "a column descriptor is missing a name" unless column_descriptor.name
+        raise "bloom_filter option not supported yet" if column_descriptor.bloom_filter
+        if column_descriptor.compression
+          compression =
+            case column_descriptor.compression.to_s
+              when 'none';   Compression::Algorithm::NONE.getName()
+              when 'gz';     Compression::Algorithm::GZ.getName()
+              when 'lzo';    Compression::Algorithm::LZO.getName()
+              else
+                raise ArgumentError, "Invalid compression type: #{column_descriptor.compression} for the column_family #{column_descriptor.name}"
+            end
         end
-    end
-    n_versions    = column_descriptor.versions
-    in_memory     = column_descriptor.in_memory
-    # set the default values of the missing parameters
-    n_versions        ||= HColumnDescriptor::DEFAULT_VERSIONS
-    compression       ||= HColumnDescriptor::DEFAULT_COMPRESSION
-    in_memory         ||= HColumnDescriptor::DEFAULT_IN_MEMORY
-    block_cache       ||= HColumnDescriptor::DEFAULT_BLOCKCACHE
-    block_size        ||= HColumnDescriptor::DEFAULT_BLOCKSIZE
-    bloomfilter       ||= HColumnDescriptor::DEFAULT_BLOOMFILTER
-    ttl               ||= HColumnDescriptor::DEFAULT_TTL
-    # add the ':' at the end if the user didn't specify it
-    column_descriptor.name << ":" unless column_descriptor.name =~ /:$/
-    cdesc = HColumnDescriptor.new(column_descriptor.name.to_bytes,
-                                  n_versions,
-                                  compression,
-                                  in_memory,
-                                  block_cache,
-                                  block_size,
-                                  ttl,
-                                  bloomfilter)
-    return cdesc
-  end
+        n_versions    = column_descriptor.versions
+        in_memory     = column_descriptor.in_memory
+        # set the default values of the missing parameters
+        n_versions        ||= HColumnDescriptor::DEFAULT_VERSIONS
+        compression       ||= HColumnDescriptor::DEFAULT_COMPRESSION
+        in_memory         ||= HColumnDescriptor::DEFAULT_IN_MEMORY
+        block_cache       ||= HColumnDescriptor::DEFAULT_BLOCKCACHE
+        block_size        ||= HColumnDescriptor::DEFAULT_BLOCKSIZE
+        bloomfilter       ||= HColumnDescriptor::DEFAULT_BLOOMFILTER
+        ttl               ||= HColumnDescriptor::DEFAULT_TTL
+        # add the ':' at the end if the user didn't specify it
+        column_descriptor.name << ":" unless column_descriptor.name =~ /:$/
+        cdesc = HColumnDescriptor.new(column_descriptor.name.to_bytes,
+                                      n_versions,
+                                      compression,
+                                      in_memory,
+                                      block_cache,
+                                      block_size,
+                                      ttl,
+                                      bloomfilter)
+        return cdesc
+      end
-end
+    end
+  end
 end
-port = ARGV[0]
-port ||= 40000
-DRb.start_service("druby://:#{port}", BigRecordDriver::HbaseServer.new)
+port = ARGV[0] || 40000
+DRb.start_service("druby://:#{port}", BigRecord::Driver::HbaseServer.new)
 puts "Started drb server on port #{port}."
 DRb.thread.join