package db.insert; /* * 创建一个students表,并进行相关操作 */ import java.io.IOException; import java.io.Serializable; import java.util.ArrayList; import java.util.List; import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.hbase.HBaseConfiguration; import org.apache.hadoop.hbase.HColumnDescriptor; import org.apache.hadoop.hbase.HTableDescriptor; import org.apache.hadoop.hbase.KeyValue; import org.apache.hadoop.hbase.MasterNotRunningException; import org.apache.hadoop.hbase.ZooKeeperConnectionException; import org.apache.hadoop.hbase.client.Delete; import org.apache.hadoop.hbase.client.Get; import org.apache.hadoop.hbase.client.HBaseAdmin; import org.apache.hadoop.hbase.client.HTable; import org.apache.hadoop.hbase.client.Put; import org.apache.hadoop.hbase.client.Result; import org.apache.hadoop.hbase.client.ResultScanner; import org.apache.hadoop.hbase.client.Scan; import org.apache.hadoop.hbase.util.Bytes; public class HBaseDBDao implements Serializable{ /** * */ private static final long serialVersionUID = 1L; // 声明静态配置 private static Configuration conf = null; private static HBaseAdmin hAdmin; private static HTable table; public HBaseDBDao(){ conf = HBaseConfiguration.create(); conf.set("hbase.zookeeper.quorum", "192.168.1.154"); conf.set("hbase.zookeeper.property.clientPort", "2181"); conf.set("hbase.master", "192.168.1.154:6000"); try { //初始化数据库管理员 hAdmin = new HBaseAdmin(conf); } catch (MasterNotRunningException e) { // TODO Auto-generated catch block e.printStackTrace(); } catch (ZooKeeperConnectionException e) { // TODO Auto-generated catch block e.printStackTrace(); } catch (IOException e) { // TODO Auto-generated catch block e.printStackTrace(); } } //初始化HTable,在插入数据,查询数据之前必须先初始化 public void initHTable(String tableName) throws IOException{ table = new HTable(conf, tableName); } //判断表是否存在 public boolean isExist(String tableName) throws IOException { return hAdmin.tableExists(tableName); } // 创建数据库表 public void createTable(String tableName, String[] columnFamilys) throws Exception { if (hAdmin.tableExists(tableName)) { System.out.println("表 "+tableName+" 已存在!"); System.exit(0); } else { // 新建一个表的描述 HTableDescriptor tableDesc = new HTableDescriptor(tableName); // 在描述里添加列族 for (String columnFamily : columnFamilys) { tableDesc.addFamily(new HColumnDescriptor(columnFamily)); } // 根据配置好的描述建表 hAdmin.createTable(tableDesc); System.out.println("创建表 "+tableName+" 成功!"); } } // 删除数据库表 public void deleteTable(String tableName) throws Exception { if (hAdmin.tableExists(tableName)) { // 关闭一个表 hAdmin.disableTable(tableName); hAdmin.deleteTable(tableName); System.out.println("删除表 "+tableName+" 成功!"); } else { System.out.println("删除的表 "+tableName+" 不存在!"); System.exit(0); } } // 批量添加数据 public void addRowBatch(String tableName, String row, String columnFamily, String column, String value) throws Exception { //将自动提交关闭,如果不关闭,每写一条数据都会进行提交,是导入数据较慢的主要因素 table.setAutoFlush(false, false); //设置缓存大小,当缓存大于设置值时,hbase会自动提交。此处可自己尝试大小,一般对大数据量,设置为5M即可,本文设置为3M。 table.setWriteBufferSize(5*1024*1024); Put put = new Put(Bytes.toBytes(row));// 指定行 // 参数分别:列族、列、值 put.add(Bytes.toBytes(columnFamily), Bytes.toBytes(column), Bytes.toBytes(value)); table.put(put); } //执行flushCommits()操作,防止最后一次数据丢失(尤其是在spark中一个分片结束时) public void flushCommits(String tableName) throws Exception { table.flushCommits(); } //添加一条数据 public void addRow(String tableName, String row, String columnFamily, String column, String value) throws Exception { Put put = new Put(Bytes.toBytes(row));// 指定行 // 参数分别:列族、列、值 put.add(Bytes.toBytes(columnFamily), Bytes.toBytes(column), Bytes.toBytes(value)); table.put(put); } // 删除一条(行)数据 public static void delRow(String tableName, String row) throws Exception { Delete del = new Delete(Bytes.toBytes(row)); table.delete(del); } // 删除多条数据 public void delMultiRows(String tableName, String[] rows) throws Exception { List<Delete> delList = new ArrayList<Delete>(); for (String row : rows) { Delete del = new Delete(Bytes.toBytes(row)); delList.add(del); } table.delete(delList); } // 获取一条数据 public void getRow(String tableName, String row) throws Exception { Get get = new Get(Bytes.toBytes(row)); Result result = table.get(get); // 输出结果,raw方法返回所有keyvalue数组 for (KeyValue rowKV : result.raw()) { System.out.print("行名:" + new String(rowKV.getRow()) + " "); System.out.print("时间戳:" + rowKV.getTimestamp() + " "); System.out.print("列族名:" + new String(rowKV.getFamily()) + " "); System.out.print("列名:" + new String(rowKV.getQualifier()) + " "); System.out.println("值:" + new String(rowKV.getValue())); } } // 获取所有数据 public void getAllRows(String tableName) throws Exception { Scan scan = new Scan(); ResultScanner results = table.getScanner(scan); // 输出结果 for (Result result : results) { for (KeyValue rowKV : result.raw()) { System.out.print("行名:" + new String(rowKV.getRow()) + " "); System.out.print("时间戳:" + rowKV.getTimestamp() + " "); System.out.print("列族名:" + new String(rowKV.getFamily()) + " "); System.out .print("列名:" + new String(rowKV.getQualifier()) + " "); System.out.println("值:" + new String(rowKV.getValue())); } } } // 主函数 public static void main(String[] args) { HBaseDBDao hb = new HBaseDBDao(); try { String tableName = "student"; hb.initHTable(tableName); // 第一步:创建数据库表:“student” String[] columnFamilys = { "info", "course" }; if(!hb.isExist(tableName)) hb.createTable(tableName, columnFamilys); // 第二步:向数据表的添加数据 // 添加第一行数据 if (hb.isExist(tableName)) { hb.addRow(tableName, "zpc", "info", "age", "20"); hb.addRow(tableName, "zpc", "info", "sex", "boy"); hb.addRow(tableName, "zpc", "course", "china", "97"); hb.addRow(tableName, "zpc", "course", "math", "128"); hb.addRow(tableName, "zpc", "course", "english", "85"); // 添加第二行数据 hb.addRow(tableName, "henjun", "info", "age", "19"); hb.addRow(tableName, "henjun", "info", "sex", "boy"); hb.addRow(tableName, "henjun", "course", "china","90"); hb.addRow(tableName, "henjun", "course", "math","120"); hb.addRow(tableName, "henjun", "course", "english","90"); // 添加第三行数据 hb.addRow(tableName, "niaopeng", "info", "age", "18"); hb.addRow(tableName, "niaopeng", "info", "sex","girl"); hb.addRow(tableName, "niaopeng", "course", "china","100"); hb.addRow(tableName, "niaopeng", "course", "math","100"); hb.addRow(tableName, "niaopeng", "course", "english","99"); // 第三步:获取一条数据 System.out.println("**************获取一条(zpc)数据*************"); hb.getRow(tableName, "zpc"); // 第四步:获取所有数据 System.out.println("**************获取所有数据***************"); hb.getAllRows(tableName); // 第五步:删除一条数据 System.out.println("************删除一条(zpc)数据************"); HBaseDBDao.delRow(tableName, "zpc"); hb.getAllRows(tableName); // 第六步:删除多条数据 System.out.println("**************删除多条数据***************"); String rows[] = new String[] { "henjun","niaopeng" }; hb.delMultiRows(tableName, rows); hb.getAllRows(tableName); // 第七步:删除数据库 System.out.println("***************删除数据库表**************"); hb.deleteTable(tableName); System.out.println("表"+tableName+"存在吗?"+hb.isExist(tableName)); } else { System.out.println(tableName + "此数据库表不存在!"); } } catch (Exception e) { e.printStackTrace(); } } }
原文:http://www.cnblogs.com/gaopeng527/p/5002349.html