HBase表操作

相对于0.9x版本（0.94/0.96/0.98），HBase 1.x版本对客户端API的改动比较大，例如连接获取和表操作相关的类库发生了变更，如下：

　　连接获取：org.apache.hadoop.hbase.client.HConnectionManager.createConnection(conf)已经过时，改为使用org.apache.hadoop.hbase.client.ConnectionFactory.createConnection(conf)；

　　表操作：org.apache.hadoop.hbase.client.HTable类已过时，改为使用org.apache.hadoop.hbase.client.Table接口（通过Connection.getTable(TableName)获取）；

第一部分：连接获取

package com.mengyao.bigdata.hbase;

import java.io.IOException;

import org.apache.hadoop.conf.Configuration;

import org.apache.hadoop.hbase.HBaseConfiguration;

import org.apache.hadoop.hbase.client.Connection;

import org.apache.hadoop.hbase.client.ConnectionFactory;

/**
 * Creates and closes HBase {@link Connection}s from a Hadoop {@link Configuration}
 * and/or an explicitly supplied ZooKeeper quorum and client port.
 *
 * <p>Precedence rules used by {@link #getConnection()}:
 * <ul>
 *   <li>If a {@code Configuration} was supplied, it is used as-is and the explicit
 *       quorum/port only fill in keys that are missing or empty in it.</li>
 *   <li>If no {@code Configuration} was supplied, a fresh one is built on every call
 *       and the explicit quorum/port (when non-empty) are applied to it.</li>
 * </ul>
 *
 * @author mengyao
 */
public class HBaseHelper {

    private static final String QUORUM = "hbase.zookeeper.quorum";
    private static final String ZK_PORT = "hbase.zookeeper.property.clientPort";

    private String quorum;
    private String zkPort;
    private Configuration conf;

    /**
     * @param conf configuration to connect with; used directly by {@link #getConnection()}
     */
    public HBaseHelper(Configuration conf) {
        this.conf = conf;
    }

    /**
     * @param quorum comma-separated ZooKeeper quorum hosts
     * @param zkPort ZooKeeper client port
     */
    public HBaseHelper(String quorum, String zkPort) {
        this.quorum = quorum;
        this.zkPort = zkPort;
    }

    /**
     * @param conf   configuration to connect with
     * @param quorum quorum used only when {@code conf} has no non-empty quorum
     * @param zkPort client port used only when {@code conf} has no non-empty client port
     */
    public HBaseHelper(Configuration conf, String quorum, String zkPort) {
        this.conf = conf;
        this.quorum = quorum;
        this.zkPort = zkPort;
    }

    /**
     * Opens a new connection. The caller owns the returned connection and must close it
     * (for example via {@link #closeAll(Connection)}).
     *
     * @return a new connection created by {@link ConnectionFactory#createConnection(Configuration)}
     * @throws IOException if the connection cannot be created
     */
    public Connection getConnection() throws IOException {
        if (null == conf) {
            // Build a fresh configuration on every call instead of caching it in the field,
            // so that later setQuorum/setZkPort calls are honoured by the next connection.
            Configuration fresh = HBaseConfiguration.create();
            setIfPresent(fresh, QUORUM, quorum);
            setIfPresent(fresh, ZK_PORT, zkPort);
            return ConnectionFactory.createConnection(fresh);
        }
        if (isBlank(conf.get(QUORUM))) {
            setIfPresent(conf, QUORUM, quorum);
        }
        if (isBlank(conf.get(ZK_PORT))) {
            setIfPresent(conf, ZK_PORT, zkPort);
        }
        return ConnectionFactory.createConnection(conf);
    }

    /**
     * Closes the given connection if it is non-null and still open.
     *
     * @param connection the connection to close; {@code null} is ignored
     * @throws IOException if closing fails
     */
    public void closeAll(Connection connection) throws IOException {
        if (null != connection && !connection.isClosed()) {
            connection.close();
        }
    }

    public String getQuorum() {
        return quorum;
    }

    public void setQuorum(String quorum) {
        this.quorum = quorum;
    }

    public String getZkPort() {
        return zkPort;
    }

    public void setZkPort(String zkPort) {
        this.zkPort = zkPort;
    }

    /** Returns true when the value is null or the empty string. */
    private static boolean isBlank(String value) {
        return null == value || value.isEmpty();
    }

    /**
     * Sets {@code key} only when a usable value was supplied. Hadoop's
     * {@code Configuration.set} rejects a null value with an IllegalArgumentException,
     * so an unset quorum/port must be skipped rather than passed through.
     */
    private static void setIfPresent(Configuration target, String key, String value) {
        if (!isBlank(value)) {
            target.set(key, value);
        }
    }

}

第二部分：表数据增删改查

package com.mengyao.bigdata.hbase;

import java.io.IOException;

import java.util.ArrayList;

import java.util.Collection;

import java.util.HashMap;

import java.util.List;

import java.util.Map;

import java.util.Map.Entry;

import org.apache.hadoop.conf.Configuration;

import org.apache.hadoop.hbase.Cell;

import org.apache.hadoop.hbase.CellUtil;

import org.apache.hadoop.hbase.HBaseConfiguration;

import org.apache.hadoop.hbase.TableName;

import org.apache.hadoop.hbase.client.Connection;

import org.apache.hadoop.hbase.client.Delete;

import org.apache.hadoop.hbase.client.Get;

import org.apache.hadoop.hbase.client.Put;

import org.apache.hadoop.hbase.client.Result;

import org.apache.hadoop.hbase.client.ResultScanner;

import org.apache.hadoop.hbase.client.Scan;

import org.apache.hadoop.hbase.client.Table;

import org.apache.hadoop.hbase.filter.CompareFilter.CompareOp;

import org.apache.hadoop.hbase.filter.SingleColumnValueFilter;

import org.apache.hadoop.hbase.util.Bytes;

import org.apache.log4j.Logger;

/**
 * Example CRUD operations against HBase using the 1.x client API
 * ({@link Connection} / {@link Table}); written for HBase 1.0.1.1.
 *
 * <p>All operations share one static {@link Connection} that is opened when the class
 * is loaded. Every {@link Table} and {@link ResultScanner} is opened per call and
 * released with try-with-resources. Row keys, families, qualifiers and values are
 * encoded and decoded as UTF-8 through {@link Bytes}.
 *
 * @author mengyao
 */
public class HBaseV1011Template {

    Logger logger = Logger.getLogger(getClass());

    private static Connection connection;

    static {
        Configuration conf = HBaseConfiguration.create();
        conf.set("hbase.zookeeper.quorum", "bdata200,bdata202,bdata203");
        conf.set("hbase.zookeeper.property.clientPort", "2181");
        HBaseHelper hBaseHelper = new HBaseHelper(conf);
        try {
            connection = hBaseHelper.getConnection();
        } catch (IOException e) {
            // Fail class loading with the real cause instead of leaving 'connection' null,
            // which would only surface later as a NullPointerException in every method.
            throw new ExceptionInInitializerError(e);
        }
    }

    public static void main(String[] args) throws IOException {
        try {
            // Insert a single row
            Map<String, String> keyValue = new HashMap<>();
            keyValue.put("name", "xiaogang");
            keyValue.put("sex", "男");
            keyValue.put("addr", "北京");
            add("test", "0005", "info", keyValue);

            // Insert several rows; each outer key is "<rowKey>_<family>"
            Map<String, Map<String, String>> keyValues = new HashMap<String, Map<String, String>>();
            Map<String, String> keyValue1 = new HashMap<>();
            keyValue1.put("name", "ligang");
            keyValue1.put("sex", "男");
            keyValue1.put("addr", "北京");
            keyValues.put("0008_info", keyValue1);
            Map<String, String> keyValue2 = new HashMap<>();
            keyValue2.put("name", "zhaojun");
            keyValue2.put("sex", "男");
            keyValue2.put("addr", "北京");
            keyValues.put("0009_info", keyValue2);
            adds("test", "_", keyValues);

            // Scan everything in the family
            System.out.println("1:"+queryForScan("test", "info"));
            // Look up by row key
            System.out.println("2:"+queryForRowKey("test", "0005", "info"));
            // Query by timestamp range (start inclusive, end exclusive)
            System.out.println("3:"+queryForTimeRange("test", "info", 1492510703521L, 1492664183955L));
            // Query by row-key range (start inclusive, end exclusive)
            System.out.println("4:"+queryForRowKeyRange("test", "info", "0001", "0003"));
            // Query by column name and column value (example 1)
            System.out.println("5:"+queryForQuilfier("test", "info", "name", "xiaoming"));
            // Query by column name and column value (example 2)
            System.out.println("6:"+queryForQuilfier("test", "info", "sex", "男"));
            // Query by column name and column value (example 3)
            System.out.println("7:"+queryForQuilfier("test", "info", "sex", "女"));
            // Delete by row key
            deleteByRowKey("test", "0005", "info");
        } finally {
            // Release the shared connection once the demo is finished.
            connection.close();
        }
    }

    /**
     * Inserts a single row.
     *
     * @param tableName target table
     * @param rowKey    row key of the new row
     * @param family    column family that receives every column
     * @param keyValue  qualifier -> value pairs to write; not modified by this method
     * @throws IOException if the write fails
     */
    private static void add(String tableName, String rowKey, String family, Map<String, String> keyValue) throws IOException {
        Put put = new Put(Bytes.toBytes(rowKey));
        byte[] familyBytes = Bytes.toBytes(family);
        for (Entry<String, String> column : keyValue.entrySet()) {
            put.addColumn(familyBytes, Bytes.toBytes(column.getKey()), Bytes.toBytes(column.getValue()));
        }
        try (Table table = connection.getTable(TableName.valueOf(tableName))) {
            table.put(put);
        }
    }

    /**
     * Inserts several rows in one batch.
     *
     * @param tableName          target table
     * @param rowFamilySeparator literal separator between row key and family in each outer
     *                           key; {@code null} or empty falls back to {@code "_"}
     * @param keyValues          map of {@code "<rowKey><separator><family>"} to the
     *                           qualifier -> value pairs of that row; not modified
     * @throws IOException              if the write fails
     * @throws IllegalArgumentException if an outer key does not contain both a row key
     *                                  and a family
     */
    private static void adds(String tableName, String rowFamilySeparator, Map<String, Map<String, String>> keyValues) throws IOException {
        String separator = (null == rowFamilySeparator || rowFamilySeparator.isEmpty()) ? "_" : rowFamilySeparator;
        // String.split takes a regex; quote the separator so characters such as '.' or '|'
        // are matched literally.
        String separatorRegex = java.util.regex.Pattern.quote(separator);

        List<Put> puts = new ArrayList<Put>();
        for (Entry<String, Map<String, String>> rowEntry : keyValues.entrySet()) {
            String[] parts = rowEntry.getKey().split(separatorRegex);
            if (parts.length < 2) {
                throw new IllegalArgumentException("Key '" + rowEntry.getKey()
                        + "' must have the form <rowKey>" + separator + "<family>");
            }
            byte[] familyBytes = Bytes.toBytes(parts[1]);
            Put put = new Put(Bytes.toBytes(parts[0]), System.currentTimeMillis());
            for (Entry<String, String> column : rowEntry.getValue().entrySet()) {
                put.addColumn(familyBytes, Bytes.toBytes(column.getKey()), Bytes.toBytes(column.getValue()));
            }
            puts.add(put);
        }
        try (Table table = connection.getTable(TableName.valueOf(tableName))) {
            table.put(puts);
        }
    }

    /**
     * Deletes a single row.
     *
     * @param tableName target table
     * @param rowKey    row key to delete
     * @param family    currently not applied: the whole row is deleted regardless of family
     * @throws IOException if the delete fails
     */
    private static void deleteByRowKey(String tableName, String rowKey, String family) throws IOException {
        try (Table table = connection.getTable(TableName.valueOf(tableName))) {
            table.delete(new Delete(Bytes.toBytes(rowKey)));
        }
    }

    /**
     * Scans every cell of one column family.
     *
     * @param tableName table to scan
     * @param family    column family to read
     * @return one map per cell with the keys {@code timestamp}, {@code rowKey},
     *         {@code family} and {@code <qualifier> -> value}
     * @throws IOException if the scan fails
     */
    public static List<Map<String, String>> queryForScan(String tableName, String family) throws IOException {
        Scan scan = new Scan();
        scan.addFamily(Bytes.toBytes(family));
        return scanCells(tableName, scan);
    }

    /**
     * Scans one column family restricted to a timestamp range.
     *
     * @param tableName table to scan
     * @param family    column family to read
     * @param minStamp  lower timestamp bound, inclusive
     * @param maxStamp  upper timestamp bound, exclusive
     * @return one map per cell, in the same shape as {@link #queryForScan(String, String)}
     * @throws IOException if the scan fails
     */
    public static List<Map<String, String>> queryForTimeRange(String tableName, String family, long minStamp, long maxStamp) throws IOException {
        Scan scan = new Scan();
        scan.addFamily(Bytes.toBytes(family));
        scan.setTimeRange(minStamp, maxStamp);
        return scanCells(tableName, scan);
    }

    /**
     * Reads one row by its row key.
     *
     * @param tableName table to read
     * @param rowKey    row key to look up
     * @param family    column family to read
     * @return a single map holding {@code rowKey}, {@code family}, every
     *         {@code <qualifier> -> value} of the row and the {@code timestamp} of the last
     *         cell processed; {@code null} when the row has no cells in that family
     * @throws IOException if the read fails
     */
    public static Map<String, String> queryForRowKey(String tableName, String rowKey, String family) throws IOException {
        Get get = new Get(Bytes.toBytes(rowKey));
        get.addFamily(Bytes.toBytes(family));
        try (Table table = connection.getTable(TableName.valueOf(tableName))) {
            Result result = table.get(get);
            if (result.isEmpty()) {
                // Kept as null (not an empty map) so existing null checks keep working.
                return null;
            }
            Map<String, String> row = new HashMap<String, String>();
            for (Cell cell : result.rawCells()) {
                putCell(row, cell);
            }
            return row;
        }
    }

    /**
     * Scans one column family restricted to a row-key range.
     *
     * @param tableName table to scan
     * @param family    column family to read
     * @param startRow  first row key, inclusive
     * @param stopRow   last row key, exclusive
     * @return one map per cell, in the same shape as {@link #queryForScan(String, String)}
     * @throws IOException if the scan fails
     */
    public static List<Map<String, String>> queryForRowKeyRange(String tableName, String family, String startRow, String stopRow) throws IOException {
        Scan scan = new Scan();
        scan.addFamily(Bytes.toBytes(family));
        scan.setStartRow(Bytes.toBytes(startRow));
        scan.setStopRow(Bytes.toBytes(stopRow));
        return scanCells(tableName, scan);
    }

    /**
     * Finds the rows whose given column equals the given value.
     *
     * @param tableName table to scan
     * @param family    column family of the column to match
     * @param qualifier qualifier of the column to match
     * @param value     value the column must equal; rows lacking the column are skipped
     * @return one map per matching row (cells merged by row key), in no particular order
     * @throws IOException if the scan fails
     */
    public static Collection<Map<String, String>> queryForQuilfier(String tableName, String family, String qualifier, String value) throws IOException {
        Scan scan = new Scan();
        SingleColumnValueFilter filter = new SingleColumnValueFilter(Bytes.toBytes(family), Bytes.toBytes(qualifier), CompareOp.EQUAL, Bytes.toBytes(value));
        filter.setFilterIfMissing(true);
        scan.setFilter(filter);

        Map<String, Map<String, String>> rowsByKey = new HashMap<String, Map<String, String>>();
        try (Table table = connection.getTable(TableName.valueOf(tableName));
                ResultScanner scanner = table.getScanner(scan)) {
            for (Result result = scanner.next(); result != null; result = scanner.next()) {
                for (Cell cell : result.rawCells()) {
                    String rowKey = Bytes.toString(CellUtil.cloneRow(cell));
                    // Always resolve the target map by row key so a cell can never be
                    // merged into the map of a previously processed row.
                    Map<String, String> row = rowsByKey.get(rowKey);
                    if (null == row) {
                        row = new HashMap<String, String>();
                        rowsByKey.put(rowKey, row);
                    }
                    putCell(row, cell);
                }
            }
        }
        return rowsByKey.values();
    }

    /** Runs the scan and returns one map per cell, closing the table and scanner afterwards. */
    private static List<Map<String, String>> scanCells(String tableName, Scan scan) throws IOException {
        List<Map<String, String>> cells = new ArrayList<Map<String, String>>();
        try (Table table = connection.getTable(TableName.valueOf(tableName));
                ResultScanner scanner = table.getScanner(scan)) {
            for (Result result = scanner.next(); result != null; result = scanner.next()) {
                for (Cell cell : result.rawCells()) {
                    Map<String, String> entry = new HashMap<String, String>();
                    putCell(entry, cell);
                    cells.add(entry);
                }
            }
        }
        return cells;
    }

    /** Writes timestamp, rowKey, family and qualifier -> value of the cell into the map, decoding as UTF-8. */
    private static void putCell(Map<String, String> target, Cell cell) {
        target.put("timestamp", String.valueOf(cell.getTimestamp()));
        target.put("rowKey", Bytes.toString(CellUtil.cloneRow(cell)));
        target.put("family", Bytes.toString(CellUtil.cloneFamily(cell)));
        target.put(Bytes.toString(CellUtil.cloneQualifier(cell)), Bytes.toString(CellUtil.cloneValue(cell)));
    }

}

HBase表操作的更多相关文章

Hbase 表操作
1. list 操作 2. 创建table column family, 3. 插入数据: put 'user' 3. 检索数据: scan table
hadoop执行hdfs文件到hbase表插入操作(xjl456852原创)
本例中需要将hdfs上的文本文件,解析后插入到hbase的表中. 本例用到的hadoop版本2.7.2 hbase版本1.2.2 hbase的表如下: create 'ns2:user', 'info ...
hbase操作（shell 命令，如建表，清空表，增删改查）以及 hbase表存储结构和原理
两篇讲的不错文章 http://www.cnblogs.com/nexiyi/p/hbase_shell.html http://blog.csdn.net/u010967382/article/de ...
HBase性能优化方法总结（二）：写表操作
转自:http://www.cnblogs.com/panfeng412/archive/2012/03/08/hbase-performance-tuning-section2.html 本文主要是 ...
HBase性能优化方法总结（三）：读表操作
本文主要是从HBase应用程序设计与开发的角度,总结几种常用的性能优化方法.有关HBase系统配置级别的优化,可参考:淘宝Ken Wu同学的博客. 下面是本文总结的第三部分内容:读表操作相关的优化方法 ...
云计算与大数据实验：Hbase shell操作用户表
[实验目的] 1)了解hbase服务 2)学会hbase shell命令操作用户表 [实验原理] HBase是一个分布式的.面向列的开源数据库,它利用Hadoop HDFS作为其文件存储系统,利用Ha ...
云计算与大数据实验：Hbase shell操作成绩表
[实验目的] 1)了解hbase服务 2)学会hbase shell命令操作成绩表 [实验原理] HBase是一个分布式的.面向列的开源数据库,它利用Hadoop HDFS作为其文件存储系统,利用Ha ...
HBase性能优化方法总结（三）：读表操作（转）
转自:http://www.cnblogs.com/panfeng412/archive/2012/03/08/hbase-performance-tuning-section3.html 本文主要是 ...
HBase表的基本结构和常用命令行操作
一.HBase表的基本结构 1.概述: 平时常见的MySQL.Oracle数据库都是传统型关系数据库,它们都是按行查询.按行存储:而HBase为非关系型数据库,它是按列存储的的. 在HBase插入数据 ...

随机推荐

React Antd中样式的修改
如果需要对antd的样式进行修改, 进入你要修改的页面注意:不能直接在自己的文件下面,加入一个css,修改这个class的样式,应该加入global限定,global {} , 在{}里面写入 . ...
Selenium驱动Chrome浏览器
import org.openqa.selenium.By;import org.openqa.selenium.WebDriver;import org.openqa.selenium.chrome ...
深挖 NGUI 基础之UIRoot (一)
当你开始使用NGUI的时候,简单的从项目视图中一个”Control”预设体拖拽到场景视图中,你将会发现 Hierarchy层次面板中会出现以下层次结构: 其中 UI Root作为根节点,是每个NG ...
Java 集合学习--ArrayList
一.ArrayList 定义 ArrayList 是一个用数组实现的集合,支持随机访问,元素有序且可以重复. ①.实现 List 接口 List接口继承Collection接口,是List类的顶层接口 ...
tp5 常见问题模板文件路由
W:视图 Q:是MVC中的V,也就是在模块下面的view目录下的html文件,就是写的页面. W:模板 Q:视图在控制器的叫法,在fetch,display等方法中传入的模板参数最后传到视图. ...
MySQL训练营02
一.表操作: 1.MySQL表的数据类型: MySQL的数据类型分为3种: 数值时间/日期字符/字符串 (1)数值类型: 包括:TinyInt.SmallInt.MediumInt.Int.Big ...
MUI scroll 定位问题
做一个微信项目,使用MUI做框架,在使用scroll定位的时候,出现了定位不准确的问题,查询了好多资料,得知他是相对定位.折腾了好久,才搞定,现在做一个笔记. mui('body').on('tap' ...
multi-tap
multi-tap又称 multi-press . 是在手机,或者电视遥控上的keypad定义,有如下2类标准: 1. ITU-T E.161 2.T9 使用举例如下: Consider a typi ...
windows bat批处理基础命令学习教程(转载)
一.基础语法: 1.批处理文件是一个“.bat”结尾的文本文件,这个文件的每一行都是一条DOS命令.可以使用任何文本文件编辑工具创建和修改.2.批处理是一种简单的程序,可以用 if 和 goto 来控 ...
【考试记录】4.8 Path （网络流 —— 劲题）
手抄代码 + 学习指针 + 冥思苦想一晚上终于——在一瞬间开窍了.果然题目都是这样:突破了一个点,一切都是柳暗花明. 题面描述: 样例: 这道题目,首先注意到给定的边的性质:这些边在平面上构成了一棵树 ...

HBase表操作

HBase表操作的更多相关文章

随机推荐

热门专题