发布时间:2019-08-31 09:44:28编辑:auto阅读(1536)
利用Python调用HBASE的 需要安装thrift hbase-thrift
启动hbase的thrift服务:bin/hbase-daemon.sh start thrift 默认端口是9090
mysql 到hbase的数据同步:
1、put
2、Importtsv
3、编写MapReduce Job导入
4、sqoop
简单code:
#!/usr/bin/env python
#coding=utf-8
import sys
sys.path.append('/usr/lib/python2.6/site-packages/hbase')
from thrift import Thrift
from thrift.transport import TSocket
from thrift.transport import TTransport
from thrift.protocol import TBinaryProtocol
from hbase import Hbase
from hbase.ttypes import *
import csv
from hbase.ttypes import ColumnDescriptor, Mutation, BatchMutation, TRegionInfo
from hbase.ttypes import IOError, AlreadyExists
######
def client_conn():
transport=TSocket.TSocket("172.16.10.87",9090)
transport=TTransport.TBufferedTransport(transport)
protocol=TBinaryProtocol.TBinaryProtocol(transport)
client=Hbase.Client(protocol)
transport.open()
return client
def __del__():
transport.close()
if __name__=="__main__":
client=client_conn()
#获取表名字
print client.getTableNames()
##创建表
#client.createTable('name2',[ColumnDescriptor(name="user_id:",maxVersions=1),ColumnDescriptor(name="user_name"),])
#写入数据
client.mutateRow('name2','a1',[Mutation(column='user_id:1',value="1")])
client.mutateRow('ca_record','1',[Mutation(column='user_id:0',value='5')])
##获取数据
aa=client.getRow('name2','a1')
for r in aa:
print 'row',r.row
print '\br'
print 'value',r.columns.get("user_id:1").value
##删除表
#client.disableTable("t1")
#client.deleteTable("t1")
print client.getTableNames()
###获取表的行键值
#print client.scannerGet(client.scannerOpen('t2',"cmd",["a"]))
print client.scannerGet(client.scannerOpen('t2',"",["a"])) #当row key为空取第一个
print "------"
print client.getColumnDescriptors('t3')
#在自己开发环境 只要安装好thrift 及hbase-thrift的包,在import的时候不会出问题
上一篇: python练习记录
下一篇: python入门(四)
48876
47943
38724
35865
30292
27048
26075
20911
20717
19076
515°
614°
618°
620°
597°
581°
650°
720°
840°
948°