python 调用HBase 范例

发布时间:2018-10-02 02:10:30   来源:文档文库   
字号:

python 调用HBase 范例

python 调用HBase 实例

新来的一个工程师不懂HBase,Java也不熟,Python还行,我建议他可以考虑通过HBase的Thrift接口来调用,完成目前的工作。

首先,安装thrift

下载thrift,这里,我用的是thrift-0.7.0-dev.tar.gz 这个版本

tar xzf thrift-0.7.0-dev.tar.gz

cd thrift-0.7.0-dev

sudo ./configure --with-cpp=no --with-ruby=no

sudo make

sudo make install

然后,到HBase的源码包里,找到

src/main/resources/org/apache/hadoop/hbase/thrift/

执行

thrift --gen py Hbase.thrift

mv gen-py/hbase/ /usr/lib/python2.4/site-packages/ (根据python版本可能有不同)

我这里写了些调用的脚本,供大家参考:

from unittest import TestCase, main

from thrift import Thrift

from thrift.transport import TSocket

from thrift.transport import TTransport

from thrift.protocol import TBinaryProtocol

from hbase import Hbase

from hbase.ttypes import ColumnDescriptor, Mutation, BatchMutation

class HBaseTester:
    """Small helper around the HBase Thrift client for a single table.

    On construction it opens a buffered Thrift connection and creates the
    table (column families ``name`` and ``foo``) if it is not listed yet.
    """

    def __init__(self, netloc, port, table="staftesttable"):
        """Connect to the Thrift server and make sure ``table`` exists.

        Args:
            netloc: Host passed to ``TSocket.TSocket``.
            port: Port passed to ``TSocket.TSocket``.
            table: Name of the table this helper reads and writes.
        """
        self.tableName = table
        self.transport = TTransport.TBufferedTransport(
            TSocket.TSocket(netloc, port))
        self.protocol = TBinaryProtocol.TBinaryProtocol(self.transport)
        self.client = Hbase.Client(self.protocol)
        self.transport.open()
        tables = self.client.getTableNames()
        if self.tableName not in tables:
            self.__createTable()

    def __del__(self):
        """Close the transport, if the constructor got far enough to set it."""
        # __init__ may raise before self.transport exists; __del__ still runs.
        transport = getattr(self, "transport", None)
        if transport is not None:
            transport.close()

    def __createTable(self):
        """Create the table with the ``name`` and ``foo`` column families."""
        name = ColumnDescriptor(name='name')
        foo = ColumnDescriptor(name='foo')
        self.client.createTable(self.tableName, [name, foo])

    def put(self, key, name, foo):
        """Write one row, storing ``name`` in ``name:v`` and ``foo`` in ``foo:v``.

        Args:
            key: Row key to mutate.
            name: Value for column ``name:v``.
            foo: Value for column ``foo:v``.
        """
        mutations = [
            Mutation(column="name:v", value=name),
            Mutation(column="foo:v", value=foo),
        ]
        # The attribute is tableName (camelCase); "tablename" never existed.
        self.client.mutateRow(self.tableName, key, mutations)

    def scanner(self, column):
        """Scan the whole table for ``column`` and return the rows found.

        Each batch returned by ``scannerGet`` contributes its first element;
        that element is printed and appended to the result. Scanning stops at
        the first empty batch.

        Args:
            column: Column (or family) name handed to ``scannerOpen``.

        Returns:
            A list with the first element of every non-empty batch.
        """
        scanner_id = self.client.scannerOpen(self.tableName, "", [column])
        result = []
        try:
            r = self.client.scannerGet(scanner_id)
            while r:
                print(r[0])
                result.append(r[0])
                r = self.client.scannerGet(scanner_id)
        finally:
            # Release the server-side scanner even if a fetch fails.
            self.client.scannerClose(scanner_id)
        print("Scanner finished")
        return result

class TestHBaseTester(TestCase):
    """Integration tests for HBaseTester.

    Every test connects to a Thrift server at localhost:9090; setUp builds
    the helper (creating the table if needed) and tearDown drops the table.
    """

    def setUp(self):
        """Create the helper, which connects and ensures the table exists."""
        self.writer = HBaseTester("localhost", 9090)

    def tearDown(self):
        """Disable and delete the test table, then close the connection."""
        name = self.writer.tableName
        client = self.writer.client
        try:
            client.disableTable(name)
            client.deleteTable(name)
        finally:
            # Close explicitly instead of waiting for garbage collection.
            self.writer.transport.close()

    def testCreate(self):
        """The table is listed and only has the expected column families."""
        tableName = self.writer.tableName
        client = self.writer.client
        self.assertTrue(self.writer.tableName in client.getTableNames())
        columns = ['name:', 'foo:']
        for i in client.getColumnDescriptors(tableName):
            self.assertTrue(i in columns)

    def testPut(self):
        """Three rows written with put() all come back from a scan."""
        self.writer.put("r1", "n1", "f1")
        self.writer.put("r2", "n2", "f2")
        self.writer.put("r3", "n3", "")
        rows = self.writer.scanner("name:")
        # Every row above has a name:v cell, so the scan must return all three.
        self.assertEqual(len(rows), 3)

if __name__ == "__main__":
    # Executed as a script: hand control to unittest's main() runner.
    main()

本文来源:https://www.2haoxitong.net/k/doc/8664a03b001ca300a6c30c22590102020740f2fb.html

《python 调用HBase 范例.doc》
将本文的Word文档下载到电脑,方便收藏和打印
推荐度:
点击下载文档

文档为doc格式