hbase手动compact与split
#!/bin/bash
# Print an error message followed by the usage text, then abort the script.
# Arguments: the words of the error message.
# Outputs:   message and usage on stderr; nothing is written to stdout.
# Returns:   does not return; exits the shell with status 1.
die() {
  echo "$@" >&2
  # The usage text is part of the diagnostic, so it goes to stderr as well;
  # stdout stays clean for callers that capture or pipe it.
  {
    echo "usage:"
    echo " $0 check|split table_name [split_size]"
  } >&2
  exit 1
}
# Parse and validate the command line: <command> <table_name> [split_size].
[[ "$#" -lt 2 ]] && die "at least 2 arguments required, $# provided"
COMMAND=$1
TABLE=$2
# Size threshold compared against the first column of `hadoop fs -du -s`;
# defaults to 1073741824 (2^30).
SIZE="${3:-1073741824}"
# The script only distinguishes "check" from "everything else", so a typo
# would otherwise be treated as a request to split. Reject it up front.
case "$COMMAND" in
  check | split) ;;
  *) die "unknown command '$COMMAND' (expected check or split)" ;;
esac
# A non-numeric threshold would be evaluated as an arithmetic expression by
# the -gt comparisons (typically yielding 0), marking every region as huge.
[[ "$SIZE" =~ ^[0-9]+$ ]] || die "split_size must be a non-negative integer, got '$SIZE'"
# Ask HBase to split one region.
# Arguments: $1 - encoded region name (the region's directory name).
# Outputs:   whatever `hbase shell` prints; diagnostics on stderr.
# Returns:   non-zero without contacting hbase shell when the region's
#            hbase:meta row key cannot be resolved to exactly one row;
#            otherwise the status of the `hbase shell` pipeline.
split() {
  local region_name=$1
  local region_key
  # hbase-scan.py prints the matching row keys on stdout, one per line.
  region_key=$(python /home/hduser/hbase/hbase-scan.py -t hbase:meta \
    -f "RowFilter (=, 'substring:${region_name}')") || return
  if [[ -z "$region_key" ]]; then
    # Without a key the command would degenerate to "split ''".
    echo "no hbase:meta row found for region '${region_name}', not splitting" >&2
    return 1
  fi
  if [[ "$region_key" == *$'\n'* ]]; then
    # Several rows matched; a multi-line key cannot form a valid command.
    echo "ambiguous hbase:meta lookup for region '${region_name}', not splitting" >&2
    return 1
  fi
  echo "split '${region_key}'" | hbase shell
}
# Split pass: runs only for the "split" command. Every region directory of
# the table whose size exceeds SIZE is handed to split().
if [[ "$COMMAND" == "split" ]]; then
  split_requested=0
  # The listing is read on fd 3 so that commands started inside the loop
  # cannot consume it from stdin.
  while IFS= read -r region <&3; do
    # Listing lines without an 8th column (e.g. the "Found N items" header
    # of `hadoop fs -ls`) arrive as empty strings.
    [[ -n "$region" ]] || continue
    region_name=${region##*/}
    # Skip dot-prefixed entries (presumably table metadata dirs, not regions).
    [[ "$region_name" == .* ]] && continue
    region_bytes=$(hadoop fs -du -s "$region" | awk '{print $1}')
    # Without a numeric size there is nothing to compare against.
    [[ "$region_bytes" =~ ^[0-9]+$ ]] || continue
    if [[ "$region_bytes" -gt "$SIZE" ]]; then
      split "$region_name"
      split_requested=1
    fi
  done 3< <(hadoop fs -ls "/hbase/data/default/$TABLE" | awk '{print $8}')
  # check after split: wait before the sizes are measured again, but only
  # when at least one split was actually requested.
  if [[ "$split_requested" -eq 1 ]]; then
    sleep 60
  fi
fi
# Check pass: report each region of the table as huge or small relative to
# SIZE, together with its human-readable size.
while IFS= read -r region <&3; do
  # Listing lines without an 8th column (e.g. the "Found N items" header
  # of `hadoop fs -ls`) arrive as empty strings.
  [[ -n "$region" ]] || continue
  region_name=${region##*/}
  # Skip dot-prefixed entries (presumably table metadata dirs, not regions).
  [[ "$region_name" == .* ]] && continue
  region_bytes=$(hadoop fs -du -s "$region" | awk '{print $1}')
  if [[ ! "$region_bytes" =~ ^[0-9]+$ ]]; then
    # An empty size would compare as 0 and be misreported as "small".
    echo "cannot determine size of region ${region_name}, skipping" >&2
    continue
  fi
  region_human=$(hadoop fs -du -s -h "$region" | awk '{print $1 $2}')
  if [[ "$region_bytes" -gt "$SIZE" ]]; then
    echo "${region_name} (${region_human}) is a huge region"
  else
    echo "${region_name} (${region_human}) is a small region"
  fi
done 3< <(hadoop fs -ls "/hbase/data/default/$TABLE" | awk '{print $8}')
专注于为中小企业提供成都网站制作、做网站服务,电脑端+手机端+微信端的三站合一,更高效的管理,为中小企业南安免费做网站提供优质的服务。我们立足成都,凝聚了一批互联网行业人才,有力地推动了超过千家企业的稳健成长,帮助中小企业通过网站建设实现规模扩充和转变。
hbase-scan.py
import subprocess
import datetime
import argparse
import csv
import gzip
import happybase
import logging
def connect_to_hbase(host='itr-hbasetest01'):
    """Open a happybase connection to HBase.

    host -- server to connect to; defaults to 'itr-hbasetest01', the
            value that used to be hard-coded here.

    Returns the happybase.Connection object.
    """
    return happybase.Connection(host)
def main():
    """Scan an HBase table and print every returned row key on its own line.

    Command-line options:
      -t/--table   table to scan (default 'eventlog')
      -p/--prefix  row-key prefix passed to the scan as row_prefix
      -f/--filter  filter string passed to the scan
      -l/--limit   maximum number of rows to return (default 10)

    Row keys go to stdout. Progress messages go through the logging module,
    which basicConfig sends to stderr by default, so stdout carries keys only.
    """
    logging.basicConfig(format='%(asctime)s %(name)s %(levelname)s: %(message)s', level=logging.INFO)
    argp = argparse.ArgumentParser(description='EventLog Reader')
    argp.add_argument('-t', '--table', dest='table', default='eventlog')
    argp.add_argument('-p', '--prefix', dest='prefix')
    argp.add_argument('-f', '--filter', dest='filter')
    # type=int makes argparse reject a non-numeric limit with a usage error
    # instead of a ValueError traceback later on.
    argp.add_argument('-l', '--limit', dest='limit', type=int, default=10)
    args = argp.parse_args()
    hbase_conn = connect_to_hbase()
    try:
        table = hbase_conn.table(args.table)
        logging.info("scan start")
        scanner = table.scan(row_prefix=args.prefix, batch_size=1000, limit=args.limit, filter=args.filter)
        # NOTE(review): happybase scans appear to be lazy, so rows are
        # probably fetched in the loop below rather than here -- confirm.
        logging.info("scan done")
        i = 0
        for key, data in scanner:
            logging.info(key)
            # Presumably keys are bytes under Python 3 (confirm for the
            # installed happybase); decode so the bare key is printed
            # rather than its b'...' repr.
            if not isinstance(key, str):
                key = key.decode('utf-8', 'replace')
            # Parenthesised form works on both Python 2 and Python 3.
            print(key)
            i += 1
        logging.info('%s rows read in total', i)
    finally:
        # Release the connection even when the scan raises.
        hbase_conn.close()
# Run the scan only when this file is executed as a script, not on import.
if __name__ == '__main__':
    main()
分享名称:hbase手动compact与split
网页URL:http://www.jxjierui.cn/article/iijigo.html


咨询
建站咨询
