summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorJohn Seekins <john.seekins@oracle.com>2014-10-08 15:27:10 -0600
committerJohn Seekins <john.seekins@oracle.com>2014-10-08 15:27:10 -0600
commit934096975087364842a92decd1bae1611aa4a685 (patch)
treeef8f2b304d0dd602920926c5813ce2344f98d326
parentecc53df4ce06d279a52358fa1c6f4df7168e0aa2 (diff)
downloadhappybase-934096975087364842a92decd1bae1611aa4a685.tar.gz
Add support for TCompactProtocol
-rw-r--r--happybase/connection.py27
1 files changed, 23 insertions, 4 deletions
diff --git a/happybase/connection.py b/happybase/connection.py
index 11f353e..26ee2bd 100644
--- a/happybase/connection.py
+++ b/happybase/connection.py
@@ -8,7 +8,7 @@ import logging
from thrift.transport.TSocket import TSocket
from thrift.transport.TTransport import TBufferedTransport, TFramedTransport
-from thrift.protocol import TBinaryProtocol
+from thrift.protocol import TBinaryProtocol, TCompactProtocol
from .hbase import Hbase
from .hbase.ttypes import ColumnDescriptor
@@ -23,11 +23,16 @@ THRIFT_TRANSPORTS = dict(
framed=TFramedTransport,
)
+THRIFT_PROTOCOLS = dict(
+ binary=TBinaryProtocol.TBinaryProtocolAccelerated,
+ compact=TCompactProtocol.TCompactProtocol,
+)
+
DEFAULT_HOST = 'localhost'
DEFAULT_PORT = 9090
DEFAULT_TRANSPORT = 'buffered'
DEFAULT_COMPAT = '0.96'
-
+DEFAULT_PROTOCOL = 'binary'
class Connection(object):
"""Connection to an HBase Thrift server.
@@ -67,6 +72,15 @@ class Connection(object):
``-hsha``, ``-nonblocking``, and ``-threadedselector`` modes use the
framed transport.
+ The optional `protocol` argument specifies the Thrift wire
+ protocol to use. Supported values for this argument are ``binary``
+ (the default) and ``compact``. Make sure to choose the right one,
+ since otherwise you might see non-obvious connection errors or
+ program hangs when making a connection. ``compact`` selects
+ TCompactProtocol, a more compact binary format that is typically
+ more efficient to process as well. ``binary`` selects
+ TBinaryProtocolAccelerated, the default protocol happybase uses.
+
.. versionadded:: 0.5
`timeout` argument
@@ -88,7 +102,7 @@ class Connection(object):
def __init__(self, host=DEFAULT_HOST, port=DEFAULT_PORT, timeout=None,
autoconnect=True, table_prefix=None,
table_prefix_separator='_', compat=DEFAULT_COMPAT,
- transport=DEFAULT_TRANSPORT):
+ transport=DEFAULT_TRANSPORT, protocol=DEFAULT_PROTOCOL):
if transport not in THRIFT_TRANSPORTS:
raise ValueError("'transport' must be one of %s"
@@ -105,6 +119,10 @@ class Connection(object):
raise ValueError("'compat' must be one of %s"
% ", ".join(COMPAT_MODES))
+ if protocol not in THRIFT_PROTOCOLS:
+ raise ValueError("'protocol' must be one of %s"
+ % ", ".join(THRIFT_PROTOCOLS))
+
# Allow host and port to be None, which may be easier for
# applications wrapping a Connection instance.
self.host = host or DEFAULT_HOST
@@ -115,6 +133,7 @@ class Connection(object):
self.compat = compat
self._transport_class = THRIFT_TRANSPORTS[transport]
+ self._protocol_class = THRIFT_PROTOCOLS[protocol]
self._refresh_thrift_client()
if autoconnect:
@@ -129,7 +148,7 @@ class Connection(object):
socket.setTimeout(self.timeout)
self.transport = self._transport_class(socket)
- protocol = TBinaryProtocol.TBinaryProtocolAccelerated(self.transport)
+ protocol = self._protocol_class(self.transport)
self.client = Hbase.Client(protocol)
def _table_name(self, name):