HBase表操作
相对于0.9.X版本,在HBase1.X版本对内部API改动比较大,例如连接部分类库变更,如下:
连接获取:org.apache.hadoop.hbase.HBaseConfiguration.createConnection(conf)已经过时,改为使用org.apache.hadoop.hbase.client.ConnectionFactory.createConnection(conf);
表操作:org.apache.hadoop.hbase.client.HTable已过时,改为使用org.apache.hadoop.hbase.client.Table接口;
第一部分:连接获取
package com.mengyao.bigdata.hbase; import java.io.IOException; import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hbase.HBaseConfiguration;
import org.apache.hadoop.hbase.client.Connection;
import org.apache.hadoop.hbase.client.ConnectionFactory; /**
*
* @author mengyao
*
*/
/**
 * Helper around HBase 1.x connection handling.
 *
 * <p>Builds a {@link Connection} through
 * {@code ConnectionFactory.createConnection(Configuration)}, the 1.x
 * replacement for the deprecated
 * {@code HBaseConfiguration.createConnection(conf)}.
 *
 * @author mengyao
 */
public class HBaseHelper {

    /** Configuration key naming the ZooKeeper quorum hosts. */
    private static final String QUORUM = "hbase.zookeeper.quorum";
    /** Configuration key naming the ZooKeeper client port. */
    private static final String ZK_PORT = "hbase.zookeeper.property.clientPort";

    private String quorum;
    private String zkPort;
    private Configuration conf;

    public HBaseHelper(Configuration conf) {
        this.conf = conf;
    }

    public HBaseHelper(String quorum, String zkPort) {
        this.quorum = quorum;
        this.zkPort = zkPort;
    }

    public HBaseHelper(Configuration conf, String quorum, String zkPort) {
        this.conf = conf;
        this.quorum = quorum;
        this.zkPort = zkPort;
    }

    /**
     * Creates a new HBase connection from the configuration held by this
     * helper. When no {@link Configuration} was supplied, a fresh one is
     * created; quorum/port entries missing from the configuration are
     * filled in from the {@code quorum}/{@code zkPort} fields.
     *
     * @return a new, caller-owned {@link Connection}
     * @throws IOException if the connection cannot be established
     * @throws IllegalStateException if neither the configuration nor the
     *         helper fields provide a quorum or client port
     */
    public Connection getConnection() throws IOException {
        if (null == conf) {
            conf = HBaseConfiguration.create();
        }
        // The original duplicated these assignments in the conf == null
        // branch; the two guarded sets below cover that case as well.
        if (isBlank(conf.get(QUORUM))) {
            conf.set(QUORUM, required(quorum, QUORUM));
        }
        if (isBlank(conf.get(ZK_PORT))) {
            conf.set(ZK_PORT, required(zkPort, ZK_PORT));
        }
        return ConnectionFactory.createConnection(conf);
    }

    /**
     * Closes the given connection if it is non-null and still open.
     *
     * @param connection the connection to close; may be {@code null}
     * @throws IOException if closing fails
     */
    public void closeAll(Connection connection) throws IOException {
        // Null guard: the original threw NPE when connection setup had failed.
        if (connection != null && !connection.isClosed()) {
            connection.close();
        }
    }

    /** True when the value carries no usable text. */
    private static boolean isBlank(String value) {
        return value == null || value.isEmpty();
    }

    /**
     * Fails fast with a clear message instead of letting
     * Configuration.set(key, null) blow up opaquely.
     */
    private static String required(String value, String key) {
        if (isBlank(value)) {
            throw new IllegalStateException("No value available for " + key);
        }
        return value;
    }

    public String getQuorum() {
        return quorum;
    }

    public void setQuorum(String quorum) {
        this.quorum = quorum;
    }

    public String getZkPort() {
        return zkPort;
    }

    public void setZkPort(String zkPort) {
        this.zkPort = zkPort;
    }
}
第二部分:表数据增删改查
package com.mengyao.bigdata.hbase; import java.io.IOException;
import java.util.ArrayList;
import java.util.Collection;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Map.Entry; import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hbase.Cell;
import org.apache.hadoop.hbase.CellUtil;
import org.apache.hadoop.hbase.HBaseConfiguration;
import org.apache.hadoop.hbase.TableName;
import org.apache.hadoop.hbase.client.Connection;
import org.apache.hadoop.hbase.client.Delete;
import org.apache.hadoop.hbase.client.Get;
import org.apache.hadoop.hbase.client.Put;
import org.apache.hadoop.hbase.client.Result;
import org.apache.hadoop.hbase.client.ResultScanner;
import org.apache.hadoop.hbase.client.Scan;
import org.apache.hadoop.hbase.client.Table;
import org.apache.hadoop.hbase.filter.CompareFilter.CompareOp;
import org.apache.hadoop.hbase.filter.SingleColumnValueFilter;
import org.apache.hadoop.hbase.util.Bytes;
import org.apache.log4j.Logger; /**
* HBase version:1.0.1.1
* @author mengyao
*
*/
/**
 * CRUD template for HBase 1.0.1.1 using the 1.x client API
 * ({@link Connection} / {@link Table} instead of the deprecated HTable).
 *
 * @author mengyao
 */
public class HBaseV1011Template {

    private static final Logger logger = Logger.getLogger(HBaseV1011Template.class);

    /** Shared, process-wide connection; created once in the static initializer. */
    private static Connection connection;

    static {
        Configuration conf = HBaseConfiguration.create();
        conf.set("hbase.zookeeper.quorum", "bdata200,bdata202,bdata203");
        conf.set("hbase.zookeeper.property.clientPort", "2181");
        HBaseHelper hBaseHelper = new HBaseHelper(conf);
        try {
            connection = hBaseHelper.getConnection();
        } catch (IOException e) {
            // As before, the class stays loadable with a null connection,
            // but the failure is now logged instead of printStackTrace().
            logger.error("Failed to create HBase connection", e);
        }
    }

    public static void main(String[] args) throws IOException {
        // Single-row put
        Map<String, String> keyValue = new HashMap<>();
        keyValue.put("name", "xiaogang");
        keyValue.put("sex", "男");
        keyValue.put("addr", "北京");
        add("test", "0005", "info", keyValue);

        // Multi-row put: each key is "<rowKey><separator><family>"
        Map<String, Map<String, String>> keyValues = new HashMap<String, Map<String, String>>();
        Map<String, String> keyValue1 = new HashMap<>();
        keyValue1.put("name", "ligang");
        keyValue1.put("sex", "男");
        keyValue1.put("addr", "北京");
        keyValues.put("0008_info", keyValue1);
        Map<String, String> keyValue2 = new HashMap<>();
        keyValue2.put("name", "zhaojun");
        keyValue2.put("sex", "男");
        keyValue2.put("addr", "北京");
        keyValues.put("0009_info", keyValue2);
        adds("test", "_", keyValues);

        // Full scan
        System.out.println("1:" + queryForScan("test", "info"));
        // Point lookup by rowKey
        System.out.println("2:" + queryForRowKey("test", "0005", "info"));
        // Timestamp range (start inclusive, end exclusive)
        System.out.println("3:" + queryForTimeRange("test", "info", 1492510703521L, 1492664183955L));
        // RowKey range (start inclusive, end exclusive)
        System.out.println("4:" + queryForRowKeyRange("test", "info", "0001", "0003"));
        // Match a qualifier against a value
        System.out.println("5:" + queryForQuilfier("test", "info", "name", "xiaoming"));
        System.out.println("6:" + queryForQuilfier("test", "info", "sex", "男"));
        System.out.println("7:" + queryForQuilfier("test", "info", "sex", "女"));
        // Delete by rowKey
        deleteByRowKey("test", "0005", "info");
    }

    /**
     * Inserts a single row.
     *
     * @param tableName target table
     * @param rowKey row key
     * @param family column family for all entries
     * @param keyValue qualifier/value pairs; cleared after the put (preserved
     *        from the original behavior — callers must not reuse the map)
     * @throws IOException on put failure
     */
    private static void add(String tableName, String rowKey, String family, Map<String, String> keyValue) throws IOException {
        // try-with-resources: the original leaked the Table when put() threw.
        try (Table table = connection.getTable(TableName.valueOf(tableName))) {
            Put put = new Put(Bytes.toBytes(rowKey));
            for (Entry<String, String> entry : keyValue.entrySet()) {
                put.addColumn(Bytes.toBytes(family), Bytes.toBytes(entry.getKey()), Bytes.toBytes(entry.getValue()));
            }
            table.put(put);
        }
        keyValue.clear();
    }

    /**
     * Inserts several rows in one batch.
     *
     * @param tableName target table
     * @param rowFamilySeparator separator between rowKey and family in the
     *        keys of {@code keyValues}; defaults to "_" when null/empty
     * @param keyValues "<rowKey><separator><family>" -> qualifier/value map;
     *        cleared after the batch put (preserved original behavior)
     * @throws IOException on put failure
     */
    private static void adds(String tableName, String rowFamilySeparator, Map<String, Map<String, String>> keyValues) throws IOException {
        // Loop-invariant default check hoisted out of the loop.
        if (null == rowFamilySeparator || rowFamilySeparator.isEmpty()) {
            rowFamilySeparator = "_";
        }
        try (Table table = connection.getTable(TableName.valueOf(tableName))) {
            List<Put> puts = new ArrayList<Put>();
            long now = System.currentTimeMillis();
            for (Entry<String, Map<String, String>> entry : keyValues.entrySet()) {
                String key = entry.getKey();
                // Literal split at the first separator. The original used
                // String.split, which treats the separator as a regex
                // (breaking for e.g. ".") and threw
                // ArrayIndexOutOfBoundsException on a missing separator.
                int sep = key.indexOf(rowFamilySeparator);
                if (sep < 0) {
                    throw new IllegalArgumentException(
                            "Key '" + key + "' does not contain separator '" + rowFamilySeparator + "'");
                }
                String rowKey = key.substring(0, sep);
                String family = key.substring(sep + rowFamilySeparator.length());
                Put put = new Put(Bytes.toBytes(rowKey), now);
                for (Entry<String, String> kv : entry.getValue().entrySet()) {
                    put.addColumn(Bytes.toBytes(family), Bytes.toBytes(kv.getKey()), Bytes.toBytes(kv.getValue()));
                }
                puts.add(put);
            }
            table.put(puts);
        }
        keyValues.clear();
    }

    /**
     * Deletes an entire row by rowKey.
     *
     * @param family currently UNUSED — kept only for signature compatibility;
     *        the whole row is deleted, not just this family (as in the original)
     * @throws IOException on delete failure
     */
    private static void deleteByRowKey(String tableName, String rowKey, String family) throws IOException {
        try (Table table = connection.getTable(TableName.valueOf(tableName))) {
            table.delete(new Delete(Bytes.toBytes(rowKey)));
        }
    }

    /**
     * Scans every cell of the given family; each cell becomes its own map
     * (one entry per returned list element, matching the original output).
     *
     * @throws IOException on scan failure
     */
    public static List<Map<String, String>> queryForScan(String tableName, String family) throws IOException {
        Scan scan = new Scan();
        scan.addFamily(Bytes.toBytes(family));
        return scanToRows(tableName, scan);
    }

    /**
     * Scans cells of the given family whose timestamps fall in
     * [minStamp, maxStamp) — start inclusive, end exclusive.
     *
     * @throws IOException on scan failure
     */
    public static List<Map<String, String>> queryForTimeRange(String tableName, String family, long minStamp, long maxStamp) throws IOException {
        Scan scan = new Scan();
        scan.addFamily(Bytes.toBytes(family));
        scan.setTimeRange(minStamp, maxStamp);
        return scanToRows(tableName, scan);
    }

    /**
     * Fetches a single row by rowKey, restricted to the given family.
     *
     * @return a map of qualifier/value pairs plus timestamp/rowKey/family
     *         metadata, or {@code null} when the row does not exist
     *         (matching the original)
     * @throws IOException on lookup failure
     */
    public static Map<String, String> queryForRowKey(String tableName, String rowKey, String family) throws IOException {
        try (Table table = connection.getTable(TableName.valueOf(tableName))) {
            Get get = new Get(Bytes.toBytes(rowKey));
            get.addFamily(Bytes.toBytes(family));
            // Direct point lookup; the original wrapped the Get in a Scan and
            // ran an equivalent but slower single-row scanner.
            Result result = table.get(get);
            if (result.isEmpty()) {
                return null;
            }
            Map<String, String> row = new HashMap<String, String>();
            for (Cell cell : result.rawCells()) {
                putCell(row, cell);
            }
            return row;
        }
    }

    /**
     * Scans rows with rowKeys in [startRow, stopRow) — start inclusive,
     * stop exclusive.
     *
     * @throws IOException on scan failure
     */
    public static List<Map<String, String>> queryForRowKeyRange(String tableName, String family, String startRow, String stopRow) throws IOException {
        Scan scan = new Scan();
        scan.addFamily(Bytes.toBytes(family));
        scan.setStartRow(Bytes.toBytes(startRow));
        scan.setStopRow(Bytes.toBytes(stopRow));
        return scanToRows(tableName, scan);
    }

    /**
     * Returns the rows whose given qualifier equals the given value,
     * one map per rowKey (cells of the same row are merged).
     *
     * @throws IOException on scan failure
     */
    public static Collection<Map<String, String>> queryForQuilfier(String tableName, String family, String qualifier, String value) throws IOException {
        Map<String, Map<String, String>> rows = new HashMap<String, Map<String, String>>();
        Scan scan = new Scan();
        SingleColumnValueFilter filter = new SingleColumnValueFilter(Bytes.toBytes(family), Bytes.toBytes(qualifier), CompareOp.EQUAL, Bytes.toBytes(value));
        // Skip rows that lack the column entirely instead of emitting them.
        filter.setFilterIfMissing(true);
        scan.setFilter(filter);
        try (Table table = connection.getTable(TableName.valueOf(tableName));
                ResultScanner rs = table.getScanner(scan)) {
            for (Result r = rs.next(); r != null; r = rs.next()) {
                for (Cell cell : r.rawCells()) {
                    String rowKey = Bytes.toString(CellUtil.cloneRow(cell));
                    Map<String, String> row = rows.get(rowKey);
                    if (row == null) {
                        row = new HashMap<String, String>();
                        rows.put(rowKey, row);
                    }
                    putCell(row, cell);
                }
            }
        }
        return rows.values();
    }

    /**
     * Runs the scan and converts every cell into its own map. Closes both
     * the Table and the ResultScanner — the original closed only the
     * scanner and leaked the Table on every query.
     */
    private static List<Map<String, String>> scanToRows(String tableName, Scan scan) throws IOException {
        List<Map<String, String>> rows = new ArrayList<Map<String, String>>();
        try (Table table = connection.getTable(TableName.valueOf(tableName));
                ResultScanner rs = table.getScanner(scan)) {
            for (Result r = rs.next(); r != null; r = rs.next()) {
                for (Cell cell : r.rawCells()) {
                    Map<String, String> row = new HashMap<String, String>();
                    putCell(row, cell);
                    rows.add(row);
                }
            }
        }
        return rows;
    }

    /**
     * Copies one cell into the map. Uses Bytes.toString (UTF-8, matching
     * Bytes.toBytes on the write path) instead of new String(byte[]),
     * which depended on the platform default charset.
     */
    private static void putCell(Map<String, String> row, Cell cell) {
        row.put("timestamp", String.valueOf(cell.getTimestamp()));
        row.put("rowKey", Bytes.toString(CellUtil.cloneRow(cell)));
        row.put("family", Bytes.toString(CellUtil.cloneFamily(cell)));
        row.put(Bytes.toString(CellUtil.cloneQualifier(cell)), Bytes.toString(CellUtil.cloneValue(cell)));
    }
}
HBase表操作的更多相关文章
- Hbase 表操作
1. list 操作 2. 创建table column family, 3. 插入数据: put 'user' 3. 检索数据: scan table
- hadoop执行hdfs文件到hbase表插入操作(xjl456852原创)
本例中需要将hdfs上的文本文件,解析后插入到hbase的表中. 本例用到的hadoop版本2.7.2 hbase版本1.2.2 hbase的表如下: create 'ns2:user', 'info ...
- hbase操作(shell 命令,如建表,清空表,增删改查)以及 hbase表存储结构和原理
两篇讲的不错文章 http://www.cnblogs.com/nexiyi/p/hbase_shell.html http://blog.csdn.net/u010967382/article/de ...
- HBase性能优化方法总结(二):写表操作
转自:http://www.cnblogs.com/panfeng412/archive/2012/03/08/hbase-performance-tuning-section2.html 本文主要是 ...
- HBase性能优化方法总结(三):读表操作
本文主要是从HBase应用程序设计与开发的角度,总结几种常用的性能优化方法.有关HBase系统配置级别的优化,可参考:淘宝Ken Wu同学的博客. 下面是本文总结的第三部分内容:读表操作相关的优化方法 ...
- 云计算与大数据实验:Hbase shell操作用户表
[实验目的] 1)了解hbase服务 2)学会hbase shell命令操作用户表 [实验原理] HBase是一个分布式的.面向列的开源数据库,它利用Hadoop HDFS作为其文件存储系统,利用Ha ...
- 云计算与大数据实验:Hbase shell操作成绩表
[实验目的] 1)了解hbase服务 2)学会hbase shell命令操作成绩表 [实验原理] HBase是一个分布式的.面向列的开源数据库,它利用Hadoop HDFS作为其文件存储系统,利用Ha ...
- HBase性能优化方法总结(三):读表操作(转)
转自:http://www.cnblogs.com/panfeng412/archive/2012/03/08/hbase-performance-tuning-section3.html 本文主要是 ...
- HBase表的基本结构和常用命令行操作
一.HBase表的基本结构 1.概述: 平时常见的MySQL.Oracle数据库都是传统型关系数据库,它们都是按行查询.按行存储:而HBase为非关系型数据库,它是按列存储的的. 在HBase插入数据 ...
随机推荐
- [CH5302]金字塔
题面 虽然探索金字塔是极其老套的剧情,但是有一队探险家还是到了某金字塔脚下.经过多年的研究,科学家对这座金字塔的内部结构已经有所了解.首先,金字塔由若干房间组成,房间之间连有通道.如果把房间看作节点, ...
- 机器学习实战一:kNN手写识别系统
实战一:kNN手写识别系统 本文将一步步地构造使用K-近邻分类器的手写识别系统.由于能力有限,这里构造的系统只能识别0-9.需要识别的数字已经使用图形处理软件,处理成具有相同的色彩和大小:32像素*3 ...
- spring与mybatis整合(基于配置文件)
本文主要介绍了如何将mybatis和spring整合在一起使用,本人使用的是mybatis3.05 + spring3.1.0M2 ,使用dbcp作为数据库连接池. 1.编写数据访问接口(UserDa ...
- ubutu下source命令问题(复制)
最近一段时间在使用Bash on Ubuntu on Windows做shell脚本调试时发现在脚本中使用source时会报错,上网查了下才了解到原来是在Ubuntu中使用的并不是bash,而是使用 ...
- HDU 1398 Square Coins 整数拆分变形 母函数
欢迎参加——BestCoder周年纪念赛(高质量题目+多重奖励) Square Coins Time Limit: 2000/1000 MS (Java/Others) Memory Limit ...
- PAT 甲级 1003 Emergency
https://pintia.cn/problem-sets/994805342720868352/problems/994805523835109376 As an emergency rescue ...
- 【历史】- 一段关于 Unix、Linux 和 Windows 的暗黑史
“SCO在言语上变得越来越好斗,而且还拒绝展示有关诉讼的任何证据,一切都似乎在表明,SCO只不过是在那里拉虎皮做大旗地狂言乱语.但是,微软决不会轻易放弃这么可以一个利用这些狂言乱语的好机会.”2003 ...
- 关于C标准
关于C标准 1. 前言 本文从英文 C-FAQ (2004 年 7 月 3 日修订版) 翻译而来.本文的 中文版权为朱群英和孙云所有. 本文的内容可以自由用于个人目的,但 是不可以未经许可出版发行. ...
- java生成和解析二维码
前言 现在,二维码的应用已经非常广泛,在线生成器也是诸多,随手生成. 所以就和大家分享一个小案例,用zxing来做一个的二维码生成器,当然这个例子是比较简单,若是写的不好请多多包涵. ZXING项目是 ...
- 制作用于日期时间型字段的DELPHI数据感知控件
用DELPHI开发C/S应用方便而快速,因为它拥有大量易于使用的数据访问和数据感知控件.然而万事总是难以完美,DELPHI的DBEdit控件用于输入日期时间型字段却很不方便,为了改善这一缺点,笔者开发 ...