0


HBase高级特性:过滤器(一)

第1关:使用过滤器查询指定行的数据

知识点

1.使用过滤器的步骤:

(1)创建过滤器:RowFilter(CompareOperator op, ByteArrayComparable rowComparator),第一个参数是比较运算符(决定如何比较),第二个参数是比较器(封装了用来与行键比较的设定值)。

第一个参数有很多种取值以匹配多种场景,取值表格如下:
| 操作 | 描述 |
| --- | --- |
| CompareOperator.LESS | 匹配小于设定值的值 |
| CompareOperator.LESS_OR_EQUAL | 匹配小于或等于设定值的值 |
| CompareOperator.EQUAL | 匹配等于设定值的值 |
| CompareOperator.NOT_EQUAL | 匹配与设定值不相等的值 |
| CompareOperator.GREATER_OR_EQUAL | 匹配大于或等于设定值的值 |
| CompareOperator.GREATER | 匹配大于设定值的值 |
| CompareOperator.NO_OP | 排除一切值 |

(2)设置过滤器。

编程要求

请补全函数 `query(String tName)`,表名会作为方法的参数传入。需要你查询的数据如下:

  • 查询basic_info列族gender列,且行键为2018的值;
  • 查询school_info列族college列,且行键大于2018的值;
  • 查询basic_info列族name列,且行键小于等于2020的值。
  1. package step1;
  2. import java.io.IOException;
  3. import org.apache.hadoop.cli.util.*;
  4. import org.apache.hadoop.conf.*;
  5. import org.apache.hadoop.hbase.*;
  6. import org.apache.hadoop.hbase.client.*;
  7. import org.apache.hadoop.hbase.filter.*;
  8. import org.apache.hadoop.hbase.util.*;
  9. public class Task {
  10. public void query(String tName) throws Exception {
  11. /********* Begin *********/
  12. Configuration config = new Configuration();
  13. Connection conn = ConnectionFactory.createConnection(config);
  14. TableName tableName = TableName.valueOf(tName);
  15. Table table = conn.getTable(tableName);
  16. Scan scan1=new Scan();
  17. scan1.addColumn(Bytes.toBytes("basic_info"), Bytes.toBytes("gender"));
  18. Filter filter1 = new RowFilter(CompareOperator.EQUAL,new BinaryComparator(Bytes.toBytes("2018")));
  19. scan1.setFilter(filter1);
  20. ResultScanner scanner1 = table.getScanner(scan1);
  21. System.out.println("row:2018");
  22. for (Result result : scanner1) {
  23. for(Cell cell : result.listCells()){
  24. System.out.println("basic_info:gender " + new String(CellUtil.cloneValue(cell),"utf-8") );
  25. }
  26. }
  27. scanner1.close();
  28. Scan scan2=new Scan();
  29. scan2.addColumn(Bytes.toBytes("school_info"), Bytes.toBytes("college"));
  30. Filter filter2 = new RowFilter(CompareOperator.GREATER,new BinaryComparator(Bytes.toBytes("2018")));
  31. scan2.setFilter(filter2);
  32. ResultScanner scanner2 = table.getScanner(scan2);
  33. for (Result result : scanner2) {
  34. System.out.println("row:" + new String(result.getRow(),"utf-8"));
  35. for(Cell cell : result.listCells()){
  36. System.out.println("school_info:college " + new String(CellUtil.cloneValue(cell),"utf-8") );
  37. }
  38. }
  39. scanner2.close();
  40. Scan scan3=new Scan();
  41. scan3.addColumn(Bytes.toBytes("basic_info"), Bytes.toBytes("name"));
  42. Filter filter3 = new RowFilter(CompareOperator.LESS_OR_EQUAL,new BinaryComparator(Bytes.toBytes("2020")));
  43. scan3.setFilter(filter3);
  44. ResultScanner scanner3 = table.getScanner(scan3);
  45. for (Result result : scanner3) {
  46. System.out.println("row:" + new String(result.getRow(),"utf-8"));
  47. for(Cell cell : result.listCells()){
  48. System.out.println("basic_info:name " + new String(CellUtil.cloneValue(cell),"utf-8") );
  49. }
  50. }
  51. scanner3.close();
  52. conn.close();
  53. /********* End *********/
  54. }
  55. }

第2关:使用正则表达式与子字符串匹配行键

知识点

比较器的子类
| 比较器 | 描述 |
| --- | --- |
| BinaryComparator | 使用 Bytes.compareTo() 比较当前值与阈值 |
| BinaryPrefixComparator | 与 BinaryComparator 类似,但是从左端开始做前缀匹配 |
| NullComparator | 不做匹配,只判断当前值是不是 null |
| BitComparator | 通过 BitwiseOp 类提供的按位与(AND)、或(OR)、异或(XOR)操作执行位级比较 |
| RegexStringComparator(正则比较器) | 在实例化比较器时指定一个正则表达式,用它去匹配表中的数据 |
| SubstringComparator(子串比较器) | 把阈值和表中数据当做 String 实例,通过 contains() 操作匹配字符串 |

编程要求

查询表 `t2_student_table` 中的数据,要求如下:

  • 查询以1开头,并以9结尾的行键,并输出该行所有列的值;
  • 查询包含231的行键,并输出该行所有列的值。
  1. package step2;
  2. import java.io.IOException;
  3. import org.apache.hadoop.cli.util.*;
  4. import org.apache.hadoop.conf.*;
  5. import org.apache.hadoop.hbase.*;
  6. import org.apache.hadoop.hbase.client.*;
  7. import org.apache.hadoop.hbase.filter.*;
  8. import org.apache.hadoop.hbase.util.*;
  9. import org.apache.hadoop.hbase.filter.SubstringComparator;
  10. public class Task {
  11. public void query() throws Exception {
  12. /********* Begin *********/
  13. Configuration config = new Configuration();
  14. Connection conn = ConnectionFactory.createConnection(config);
  15. TableName tablename=TableName.valueOf("t2_student_table");
  16. Table table=conn.getTable(tablename);
  17. Scan scan1=new Scan();
  18. Filter filter1 = new RowFilter(CompareOperator.EQUAL,new RegexStringComparator("1.*9$")); //查询以1开头,并以9结尾的行键
  19. scan1.setFilter(filter1);
  20. ResultScanner scanner1 = table.getScanner(scan1);
  21. for (Result result : scanner1) {
  22. System.out.println("row:" + new String(result.getRow(),"utf-8"));
  23. for(Cell cell : result.listCells()){
  24. String family = Bytes.toString(CellUtil.cloneFamily(cell));
  25. String qualifier = Bytes.toString(CellUtil.cloneQualifier(cell));
  26. String value = Bytes.toString(CellUtil.cloneValue(cell));
  27. System.out.println(family + ":" + qualifier + " " + value);
  28. }
  29. }
  30. scanner1.close();
  31. Scan scan2=new Scan();
  32. Filter filter2 = new RowFilter(CompareOperator.EQUAL,new SubstringComparator("231")); //查询包含231的行键
  33. scan2.setFilter(filter2);
  34. ResultScanner scanner2 = table.getScanner(scan2);
  35. for (Result result : scanner2) {
  36. System.out.println("row:" + new String(result.getRow(),"utf-8"));
  37. for(Cell cell : result.listCells()){
  38. String family = Bytes.toString(CellUtil.cloneFamily(cell));
  39. String qualifier = Bytes.toString(CellUtil.cloneQualifier(cell));
  40. String value = Bytes.toString(CellUtil.cloneValue(cell));
  41. System.out.println(family + ":" + qualifier + " " + value);
  42. }
  43. }
  44. scanner2.close();
  45. conn.close();
  46. /********* End *********/
  47. }
  48. }

第3关:列族过滤器、值过滤器、列名过滤器

编程要求

使用过滤器对表 `t3_student_table` 完成如下查询操作:

  • 查询行键1019中列族school_info所有列,输出值;
  • 查询行键2020中,列名包含字母c的所有列,输出值;
  • 查询表所有行中包含“张”的值,并输出该值。
  1. package step3;
  2. import java.io.IOException;
  3. import org.apache.hadoop.cli.util.*;
  4. import org.apache.hadoop.conf.*;
  5. import org.apache.hadoop.hbase.*;
  6. import org.apache.hadoop.hbase.client.*;
  7. import org.apache.hadoop.hbase.filter.*;
  8. import org.apache.hadoop.hbase.util.*;
  9. import org.apache.hadoop.hbase.filter.SubstringComparator;
  10. public class Task {
  11. public void query() throws Exception {
  12. /********* Begin *********/
  13. Configuration config = new Configuration();
  14. Connection conn = ConnectionFactory.createConnection(config);
  15. TableName tableName = TableName.valueOf(Bytes.toBytes("t3_student_table"));
  16. Table table = conn.getTable(tableName);
  17. Filter filter1 = new FamilyFilter(CompareOperator.EQUAL,new BinaryComparator(Bytes.toBytes("school_info"))); //列族过滤器
  18. Get get1 = new Get(Bytes.toBytes("1019"));
  19. get1.setFilter(filter1);
  20. Result result1 = table.get(get1);
  21. System.out.println("row:" + new String(result1.getRow(),"utf-8"));
  22. for(Cell cell : result1.listCells()){
  23. String family = Bytes.toString(CellUtil.cloneFamily(cell));
  24. String qualifier = Bytes.toString(CellUtil.cloneQualifier(cell));
  25. String value = Bytes.toString(CellUtil.cloneValue(cell));
  26. System.out.println(family + ":" + qualifier + " " + value);
  27. }
  28. Filter filter2 = new QualifierFilter(CompareOperator.EQUAL,
  29. new SubstringComparator("c")); //列名过滤器
  30. Get get2 = new Get(Bytes.toBytes("2020"));
  31. get2.setFilter(filter2);
  32. Result result2 = table.get(get2);
  33. System.out.println("row:" + new String(result2.getRow(),"utf-8"));
  34. for(Cell cell : result2.listCells()){
  35. String family = Bytes.toString(CellUtil.cloneFamily(cell));
  36. String qualifier = Bytes.toString(CellUtil.cloneQualifier(cell));
  37. String value = Bytes.toString(CellUtil.cloneValue(cell));
  38. System.out.println(family + ":" + qualifier + " " + value);
  39. }
  40. Scan scan3 = new Scan();
  41. Filter filter3 = new ValueFilter(CompareOperator.EQUAL, new SubstringComparator("张")); //值过滤器
  42. scan3.setFilter(filter3);
  43. ResultScanner scanner3 = table.getScanner(scan3);
  44. for (Result result : scanner3) {
  45. System.out.println("row:" + new String(result.getRow(),"utf-8"));
  46. for(Cell cell : result.listCells()){
  47. String family = Bytes.toString(CellUtil.cloneFamily(cell));
  48. String qualifier = Bytes.toString(CellUtil.cloneQualifier(cell));
  49. String value = Bytes.toString(CellUtil.cloneValue(cell));
  50. System.out.println(family + ":" + qualifier + " " + value);
  51. }
  52. }
  53. scanner3.close();
  54. conn.close();
  55. /********* End *********/
  56. }
  57. }

本文转载自: https://blog.csdn.net/m0_52680439/article/details/134362931
版权归原作者 咖啡不提神 所有, 如有侵权,请联系我们删除。

“HBase高级特性:过滤器(一)”的评论:

还没有评论