hbase api常用方法使用及預分割槽解決熱點問題

阿新 • • 發佈：2019-02-16

API 操作：

import java.io.IOException;
import java.util.ArrayList;
import java.util.List;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hbase.HBaseConfiguration;
import org.apache.hadoop.hbase.HColumnDescriptor;
import org.apache.hadoop.hbase.HTableDescriptor;
import org.apache.hadoop.hbase.KeyValue;
import org.apache.hadoop.hbase.MasterNotRunningException;
import org.apache.hadoop.hbase.TableName;
import org.apache.hadoop.hbase.ZooKeeperConnectionException;
import org.apache.hadoop.hbase.client.Get;
import org.apache.hadoop.hbase.client.HBaseAdmin;
import org.apache.hadoop.hbase.client.HTable;
import org.apache.hadoop.hbase.client.HTablePool;
import org.apache.hadoop.hbase.client.Put;
import org.apache.hadoop.hbase.client.Result;
import org.apache.hadoop.hbase.client.ResultScanner;
import org.apache.hadoop.hbase.client.Scan;
import org.apache.hadoop.hbase.filter.CompareFilter.CompareOp;
import org.apache.hadoop.hbase.filter.Filter;
import org.apache.hadoop.hbase.filter.FilterList;
import org.apache.hadoop.hbase.filter.PrefixFilter;
import org.apache.hadoop.hbase.filter.SingleColumnValueFilter;
import org.apache.hadoop.hbase.util.Bytes;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import com.kktest.hbase.HashChoreWoker;
import com.kktest.hbase.HashRowKeyGenerator;
import com.kktest.hbase.RowKeyGenerator;
import com.kktest.hbase.BitUtils;

/**
 * hbase 客戶端
 * 
 * @author kuang hj
 * 
 */
@SuppressWarnings("all")
public class HBaseClient {

    private static Logger logger = LoggerFactory.getLogger(HBaseClient.class);
    private static Configuration config;
    static {
        config = HBaseConfiguration.create();
        config.set("hbase.zookeeper.quorum",
                "192.168.1.100:2181,192.168.1.101:2181,192.168.1.103:2181");
    }

    /**
     * 根據隨機雜湊（hash）建立分割槽表
     * 
     * @throws Exception
     *             hash_split_table
     */
    public static void testHashAndCreateTable(String tableNameTmp,
            String columnFamily) throws Exception {<p>        // 取隨機雜湊 10 代表 10個分割槽
        HashChoreWoker worker = new HashChoreWoker(1000000, 10);
        byte[][] splitKeys = worker.calcSplitKeys();

        HBaseAdmin admin = new HBaseAdmin(config);
        TableName tableName = TableName.valueOf(tableNameTmp);

        if (admin.tableExists(tableName)) {
            try {
                admin.disableTable(tableName);
            } catch (Exception e) {
            }
            admin.deleteTable(tableName);
        }

        HTableDescriptor tableDesc = new HTableDescriptor(tableName);
        HColumnDescriptor columnDesc = new HColumnDescriptor(
                Bytes.toBytes(columnFamily));
        columnDesc.setMaxVersions(1);
        tableDesc.addFamily(columnDesc);

        admin.createTable(tableDesc, splitKeys);

        admin.close();
    }

    /**
     * @Title: queryData
     * @Description: 從HBase查詢出資料
     * @author kuang hj
     * @param tableName
     *            表名
     * @param rowkey
     *            rowkey
     * @return 返回使用者資訊的list
     * @throws Exception
     */
    @SuppressWarnings("all")
    public static ArrayList<String> queryData(String tableName, String rowkey)
            throws Exception {
        ArrayList<String> list = new ArrayList<String>();
        logger.info("開始時間");
        HTable table = new HTable(config, tableName);

        Get get = new Get(rowkey.getBytes()); // 根據主鍵查詢
        Result r = table.get(get);
        logger.info("結束時間");
        KeyValue[] kv = r.raw();
        for (int i = 0; i < kv.length; i++) {
            // 迴圈每一列
            String key = kv[i].getKeyString();
            
            String value = kv[i].getValueArray().toString();
            
            // 將查詢到的結果寫入List中
            list.add(key + ":"+ value);
            
        }// end of 遍歷每一列
        
        return list;
    }

    /**
     * 增加表資料
     * 
     * @param tableName
     * @param rowkey
     */
    public static void insertData(String tableName, String rowkey) {
        HTable table = null;
        try {
            table = new HTable(config, tableName);
            // 一個PUT代表一行資料，再NEW一個PUT表示第二行資料,每行一個唯一的ROWKEY，此處rowkey為put構造方法中傳入的值
            for (int i = 1; i < 100; i++) {
                byte[] result = getNumRowkey(rowkey,i);
                Put put = new Put(result);
                // 本行資料的第一列
                put.add(rowkey.getBytes(), "name".getBytes(),
                        ("aaa" + i).getBytes());
                // 本行資料的第三列
                put.add(rowkey.getBytes(), "age".getBytes(),
                        ("bbb" + i).getBytes());
                // 本行資料的第三列
                put.add(rowkey.getBytes(), "address".getBytes(),
                        ("ccc" + i).getBytes());

                table.put(put);
            }

        } catch (Exception e1) {
            e1.printStackTrace();
        }
    }

    private static byte[] getNewRowkey(String rowkey) {
        byte[] result = null;

        RowKeyGenerator rkGen = new HashRowKeyGenerator();
        byte[] splitKeys = rkGen.nextId();

        byte[] rowkeytmp = rowkey.getBytes();

        result = new byte[splitKeys.length + rowkeytmp.length];
        System.arraycopy(splitKeys, 0, result, 0, splitKeys.length);
        System.arraycopy(rowkeytmp, 0, result, splitKeys.length,
                rowkeytmp.length);

        return result;
    }
    
    public static void main(String[] args) {
        RowKeyGenerator rkGen = new HashRowKeyGenerator();
        byte[] splitKeys = rkGen.nextId();
        System.out.println(splitKeys);    
    }

    private static byte[] getNumRowkey(String rowkey, int i) {
        byte[] result = null;

        RowKeyGenerator rkGen = new HashRowKeyGenerator();
        byte[] splitKeys = rkGen.nextId();

        byte[] rowkeytmp = rowkey.getBytes();

        byte[] intVal = BitUtils.getByteByInt(i);
        result = new byte[splitKeys.length + rowkeytmp.length + intVal.length];
        System.arraycopy(splitKeys, 0, result, 0, splitKeys.length);
        System.arraycopy(rowkeytmp, 0, result, splitKeys.length,
                rowkeytmp.length);
        System.arraycopy(intVal, 0, result, splitKeys.length+rowkeytmp.length,
                intVal.length);

        return result;
    }
    
    

    /**
     * 刪除表
     * 
     * @param tableName
     */
    public static void dropTable(String tableName) {
        try {
            HBaseAdmin admin = new HBaseAdmin(config);
            admin.disableTable(tableName);
            admin.deleteTable(tableName);
        } catch (MasterNotRunningException e) {
            e.printStackTrace();
        } catch (ZooKeeperConnectionException e) {
            e.printStackTrace();
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * 查詢所有
     * 
     * @param tableName
     */
    public static void QueryAll(String tableName) {
        HTable table  = null;
        try {
            table  = new HTable(config, tableName);
            ResultScanner rs = table.getScanner(new Scan());
            for (Result r : rs) {
                System.out.println("獲得到rowkey:" + new String(r.getRow()));
                for (KeyValue keyValue : r.raw()) {
                    System.out.println("列：" + new String(keyValue.getFamily())
                            + "====值:" + new String(keyValue.getValue()));
                }
            }
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * 查詢所有
     * 
     * @param tableName
     */
    public static void QueryByCondition1(String tableName) {

        HTable table = null;
        try {
            table  = new HTable(config, tableName);
            Get scan = new Get("abcdef".getBytes());// 根據rowkey查詢
            Result r = table.get(scan);
            System.out.println("獲得到rowkey:" + new String(r.getRow()));
            for (KeyValue keyValue : r.raw()) {
                System.out.println("列：" + new String(keyValue.getFamily())
                        + "====值:" + new String(keyValue.getValue()));
            }
        } catch (IOException e) {
            e.printStackTrace();
        }
    }
    
    /**
     *  根據rowkwy前墜查詢 
     * @param tableName
     * @param rowkey
     */
    public static void queryByRowKey(String tableName,String rowkey)
    {
        try {
            HTable table = new HTable(config, tableName);
            Scan scan = new Scan();
            scan.setFilter(new PrefixFilter(rowkey.getBytes()));
            ResultScanner rs = table.getScanner(scan);
            KeyValue[] kvs = null;
            for (Result tmp : rs)
            {
                kvs = tmp.raw();
                for (KeyValue kv : kvs)
                {
                    System.out.print(kv.getRow()+" ");
                    System.out.print(kv.getFamily()+" :");
                    System.out.print(kv.getQualifier()+" ");
                    System.out.print(kv.getTimestamp()+" ");
                    System.out.println(kv.getValue());
                }
            }
        } catch (IOException e) {
            e.printStackTrace();
        }
        
    }
    /**
     * 查詢所有
     * 
     * @param tableName
     */
    public static void QueryByCondition2(String tableName) {

        try {
            HTable table = new HTable(config, tableName);
            // 當列column1的值為aaa時進行查詢
            Filter filter = new SingleColumnValueFilter(
                    Bytes.toBytes("column1"), null, CompareOp.EQUAL,
                    Bytes.toBytes("aaa")); 
            Scan s = new Scan();
            s.setFilter(filter);
            ResultScanner rs = table.getScanner(s);
            for (Result r : rs) {
                System.out.println("獲得到rowkey:" + new String(r.getRow()));
                for (KeyValue keyValue : r.raw()) {
                    System.out.println("列：" + new String(keyValue.getFamily())
                            + "====值:" + new String(keyValue.getValue()));
                }
            }
        } catch (Exception e) {
            e.printStackTrace();
        }

    }

    /**
     * 查詢所有
     * 
     * @param tableName
     */
    public static void QueryByCondition3(String tableName) {

        try {
            
            HTable table = new HTable(config, tableName);

            List<Filter> filters = new ArrayList<Filter>();

            Filter filter1 = new SingleColumnValueFilter(
                    Bytes.toBytes("column1"), null, CompareOp.EQUAL,
                    Bytes.toBytes("aaa"));
            filters.add(filter1);

            Filter filter2 = new SingleColumnValueFilter(
                    Bytes.toBytes("column2"), null, CompareOp.EQUAL,
                    Bytes.toBytes("bbb"));
            filters.add(filter2);

            Filter filter3 = new SingleColumnValueFilter(
                    Bytes.toBytes("column3"), null, CompareOp.EQUAL,
                    Bytes.toBytes("ccc"));
            filters.add(filter3);

            FilterList filterList1 = new FilterList(filters);

            Scan scan = new Scan();
            scan.setFilter(filterList1);
            ResultScanner rs = table.getScanner(scan);
            for (Result r : rs) {
                System.out.println("獲得到rowkey:" + new String(r.getRow()));
                for (KeyValue keyValue : r.raw()) {
                    System.out.println("列：" + new String(keyValue.getFamily())
                            + "====值:" + new String(keyValue.getValue()));
                }
            }
            rs.close();

        } catch (Exception e) {
            e.printStackTrace();
        }

    }
}</p>

HashChoreWoker：

import java.util.Iterator;
import java.util.TreeSet;

import org.apache.hadoop.hbase.util.Bytes;

/**
 * 
 * @author kuang hj
 *
 */
public class HashChoreWoker{
    // 隨機取機數目
    private int baseRecord;
    // rowkey生成器
    private RowKeyGenerator rkGen;
    // 取樣時，由取樣數目及region數相除所得的數量.
    private int splitKeysBase;
    // splitkeys個數
    private int splitKeysNumber;
    // 由抽樣計算出來的splitkeys結果
    private byte[][] splitKeys;

    public HashChoreWoker(int baseRecord, int prepareRegions) {
        this.baseRecord = baseRecord;
        // 例項化rowkey生成器
        rkGen = new HashRowKeyGenerator();
        splitKeysNumber = prepareRegions - 1;
        splitKeysBase = baseRecord / prepareRegions;
    }

    public byte[][] calcSplitKeys() {
        splitKeys = new byte[splitKeysNumber][];
        // 使用treeset儲存抽樣資料，已排序過
        TreeSet<byte[]> rows = new TreeSet<byte[]>(Bytes.BYTES_COMPARATOR);
        for (int i = 0; i < baseRecord; i++) {
            rows.add(rkGen.nextId());
        }
        int pointer = 0;
        Iterator<byte[]> rowKeyIter = rows.iterator();
        int index = 0;
        while (rowKeyIter.hasNext()) {
            byte[] tempRow = rowKeyIter.next();
            rowKeyIter.remove();
            if ((pointer != 0) && (pointer % splitKeysBase == 0)) {
                if (index < splitKeysNumber) {
                    splitKeys[index] = tempRow;
                    index++;
                }
            }
            pointer++;
        }
        rows.clear();
        rows = null;
        return splitKeys;
    }
}

HashRowKeyGenerator：
import org.apache.hadoop.hbase.util.Bytes;
import org.apache.hadoop.hbase.util.MD5Hash;

import com.kktest.hbase.BitUtils;
/**
*
*
**/
public class HashRowKeyGenerator implements RowKeyGenerator {
    private static long currentId = 1;
    private static long currentTime = System.currentTimeMillis();
    //private static Random random = new Random();

    public byte[] nextId() 
    {
        try {
            currentTime = getRowKeyResult(Long.MAX_VALUE - currentTime);
            byte[] lowT = Bytes.copy(Bytes.toBytes(currentTime), 4, 4);
            byte[] lowU = Bytes.copy(Bytes.toBytes(currentId), 4, 4);
            byte[] result = Bytes.add(MD5Hash.getMD5AsHex(Bytes.add(lowT, lowU))
                    .substring(0, 8).getBytes(), Bytes.toBytes(currentId));
            return result;
        } finally {
            currentId++;
        }
    }
    
    /**
     *  getRowKeyResult
     * @param tmpData
     * @return
     */
    public static long getRowKeyResult(long tmpData)
    {
        String str = String.valueOf(tmpData);
        StringBuffer sb = new StringBuffer();
        char[] charStr = str.toCharArray();
        for (int i = charStr.length -1 ; i > 0; i--)
        {
            sb.append(charStr[i]);
        }
        
        return Long.parseLong(sb.toString());
    }
}

</pre><pre name="code" class="java">

hbase api常用方法使用及預分割槽解決熱點問題

API 操作：import java.io.IOException; import java.util.ArrayList; import java.util.List; import org.apache.hadoop.conf.Configuration; impor

Hbase叢集安裝配置及常見問題解決方法

Hbase介紹 HBASE是一個高可靠性、高效能、面向列、可伸縮的分散式儲存系統，利用HBASE技術可在廉價PC Server上搭建起大規模結構化儲存叢集。 HBASE的目標是儲存並處理大型的資料，更具體來說是僅需使用普通的硬體配置，就能夠處理由成千上萬的行和列所組成的大型

無法開啟預編譯標頭檔案的解決方法及預編譯頭原理[ZZ]

1。用VC.NET編輯程式，按Ctrl+F7,出現下列錯誤： fatal error C1083: 無法開啟預編譯標頭檔案：“Debug/UGFace.pch”: No such file or directory 解決方法：修改：專案->屬性->C/C

error無法開啟預編譯標頭檔案的解決方法及預編譯頭原理

1。用VC.NET編輯程式，按Ctrl+F7,出現下列錯誤： fatal error C1083: 無法開啟預編譯標頭檔案：“Debug/UGFace.pch”: No such file or directory 解決方法：修改：專案->屬性->C/C++

Java File類常用方法及實例

獲取而且 exist exc file類註釋 sys 遞歸遍歷 cep 創建：createNewFile()在指定位置創建一個空文件，成功就返回true，如果已存在就不創建，然後返回false。mkdir() 在指定位置創建一個單級文件夾。mkdirs() 在指定位

Selenium API常用方法

取消 bmi ren out 清除 ble itl att css driver.findElements()//定位一組List元素集合 driver.findElement()//定位一個元素 driver.getTitle()//獲取頁面標題 driver.get()

js數組string對象api常用方法

位置字符串數組 tor body object split script 常用 bst charAt() 方法可返回指定位置的字符。 stringObject.charAt(index) indexOf() 方法可返回某個指定的字符串值在字符串中首次出現的

【監控】Jprofiler監控tomcat的配置方法及報錯解決過程

could CA 監聽端口 arch https img .net http 沒有準備工作： 1.Jprofiler for Linux安裝包一個（服務端） 2.Jprofiler for windows安裝包一個（客戶端） 3.各自安裝、解壓 Linux：/opt/jp

35 並行/發同/異步非/ 阻塞進程的兩種開啟方式, 進程的常用方法及屬性

self 屬性任務序列設置並行告訴方法 main 解釋器主要內容: 1 名詞解釋並行 : 即兩件事情或多件事情,在同一時間點同時執行.是從微觀上，也就是在一個精確的時間片刻，有不同的程序在執行，這就要求必須有多個處理器並發 : 即兩件事情或多件事情在

Java面向對象-- String 類常用方法及基本使用

for str news http clas substr 實例 div print 首先來學習基本使用Jdk api chm文檔：點擊左上角-顯示： 1, char chartAt(int index) 返回指定索引處的char值這裏的index 是從0

Java面向物件-- String 類常用方法及基本使用

首先來學習基本使用Jdk api chm文件：點選左上角-顯示： 1, char chartAt(int index) 返回指定索引處的char值這裡的index 是從0開始的； package com.xuyigang1234.chp02.strin

JAVA高階基礎（11）---Map的常用方法及遍歷方式

Map 注：更多詳細方法請查詢 API Map介面和Collection介面的不同 Map是雙列的,Collection是單列的 Map的鍵唯一,Collection的子體系Set是唯一的 Map集合的資料結構值針對鍵有效，跟值無關；Collection

同義詞挖掘的一些常用方法及同義詞替換程式

先談談同義詞挖掘的一些常用方法在使用者使用搜索引擎的過程中，由於地區差異、文化水平等差異，使用者所輸入的query很多時候和資料中的描述不一致。這種情況下，為了能夠召回更多的文件向用戶展示，搜尋引擎需要對使用者的輸入做同義詞、糾錯、歸一化等操作。在進行這些操作的過程中，

GCD常用方法及應用場景

開發過程中，出現耗時操作造成介面卡頓是常見的問題之一，問題原因就是因為耗時操作阻塞了主執行緒，所以要解決這類問題最簡單的就是引進子執行緒，將耗時操作移出主執行緒，耗時操作完成後回到主執行緒中更新UI。之前在做一個通訊錄的時候，由於需要自己進行排序，所以第一次時需要將幾千條的資料都拉下

Eclipse 常用技巧及常見問題解決

Eclipse默許函式摺疊開啟之前更新了eclipse的一些外掛之後,每次開啟程式碼eclipse 預設把程式碼裡面的函式程式碼和註釋,import 內容都給摺疊了,雖然看起來精簡了,但是有些不方便,要一個個點開. 於是查了一下關於摺疊的方法的配置. win

Hbase API核心流程及程式碼

核心流程獲取配置物件為該物件指定hbase的叢集通過配置物件建立連線通過連接獲取管理員物件通過管理員物件對錶進行操作關閉連線程式碼 public class HBase_API { public static void main(Strin

String 物件常用方法及屬性詳細介紹

String物件的屬性：　　1、constructor ：對建立該物件的函式的引用　　2、length ：字串長度　　3、prototype ：允許您向物件新增屬性和方法 String物件的方法：　　1、charAt() 方法可返回指定位置的

一種攔截Linux動態庫API的方法及裝置

描述攔截Linux動態庫API的常規方法，是基於動態符號連結覆蓋技術實現的，基本步驟是 1. 重新命名要攔截的目標動態庫。 2. 建立新的同名動態庫，定義要攔截的同名API，在API內部呼叫原動態庫對應的API。這裡的同名是指與重新命名前動態庫前的名稱相同。顯而易見

request常用方法及應用

request常用方法獲得客戶機資訊 getRequestURL方法返回客戶端發出請求時的完整URL。 getRequestURI方法返回請求行中的資源名部分。 getQueryString 方法返回請求行中的引數部分。 getRemoteAddr方法返回發出請求

java中Request和Response常用方法及舉例

Request的常用方法: setAttribute() 在Request域中儲存資料 setCharacterEncoding() 設定請求引

hbase api常用方法使用及預分割槽解決熱點問題

相關推薦