1,需求:已知空气监测数据在hbase中存储,要求按照时间,查询citycode为110000(北京)一个月的数据,数据为每日的监测数据
ID ,CITYCODE,SO2 ,CO,NO2 ,O3, PM10,PM2_5,AQI,MEASURE, TIMEPOINT
13110000020141120, 110000,31,3.939,141,8,368,301,351,6,2014-11-20
5110000020150108, 110000,53,3.305,101,12,176,143,190,4,2015-01-08
key值设计规则:
String yearMoth= "201411"; //年月
String time="20141120"; //年月日
String citycode="1100000"; //城市编码
//hbase 为20个分区,数据进入hbase的分区规则如下
int region=Math.abs((yearMoth+citycode).hashCode())%20; //结果:8
//hbase的key值为
String key =region+citycode+time;
这样设计key的好处是:同一个城市,每个月的数据的分区相同,即region相同,只需要设置startRowkey与endRowKey即可
例如 查询北京 2014 年 11 月的数据
startRowkey:13110000020141100
endRowkey: 13110000020141200 即可
但:如果查询 2014 年11 月20 号 --- 2015年01月08号的数据 则需要把每个月的数据查询出来,合并到一起
以下 为工具类的的方法:
创建 时间范围的javaBean对象
public class TimeRange {
private String startPoint ;
private String endPoint ;
public String getStartPoint() {
return startPoint;
}
public void setStartPoint(String startPoint) {
this.startPoint = startPoint;
}
public String getEndPoint() {
return endPoint;
}
public void setEndPoint(String endPoint) {
this.endPoint = endPoint;
}
public String toString() {
return startPoint + " - " + endPoint ;
}
}
计算时间范围的工具类:
startStr =20141120
endStr=20150108
得到的结果 List 为 20141120-20141201
20141201-20150101
20150101-20150108
/**
* 计算查询时间范围
*/
public static List getCallLogRanges(String startStr , String endStr){
try{
SimpleDateFormat sdfYMD = new SimpleDateFormat("yyyyMMdd");
SimpleDateFormat sdfYM = new SimpleDateFormat("yyyyMM");
DecimalFormat df00 = new DecimalFormat("00");
//
List list = new ArrayList<>();
//字符串时间
String startPrefix = startStr.substring(0, 6);
String endPrefix = endStr.substring(0, 6);
int endDay = Integer.parseInt(endStr.substring(6, 8));
//结束点
String endPoint = endPrefix + df00.format(endDay + 1);
//日历对象
Calendar c = Calendar.getInstance();
//同年月
if (startPrefix.equals(endPrefix)) {
TimeRange range = new TimeRange ();
range.setStartPoint(startStr); //设置起始点
range.setEndPoint(endPoint); //设置结束点
list.add(range);
} else {
//1.起始月
TimeRange range = new TimeRange ();
range.setStartPoint(startStr);
//设置日历的时间对象
c.setTime(sdfYMD.parse(startStr));
c.add(Calendar.MONTH, 1);
range.setEndPoint(sdfYM.format(c.getTime()));
list.add(range);
//是否是最后一月
while (true) {
//到了结束月份
if (endStr.startsWith(sdfYM.format(c.getTime()))) {
range = new TimeRange ();
range.setStartPoint(sdfYM.format(c.getTime()));
range.setEndPoint(endPoint);
list.add(range);
break;
} else {
range = new TimeRange ();
//起始时间
range.setStartPoint(sdfYM.format(c.getTime()));
//增加月份
c.add(Calendar.MONTH, 1);
range.setEndPoint(sdfYM.format(c.getTime()));
list.add(range);
}
}
}
return list ;
}
catch(Exception e){
e.printStackTrace();
}
return null ;
}
Hbase 查询的时 遍历List
public List getLogByContion(String citycode, List ranges) {
Configuration conf = HBaseConfiguration.create();
Connection conn = ConnectionFactory.createConnection(conf);
TableName tableName = TableName.valueOf("hbase:airDay");
table=conn.getTable(tableName);
List list = new ArrayList<>();
try {
for (TimeRange range: ranges) {
Scan scan = new Scan();
//设置扫描起始行 结束行
scan.setStartRow(Bytes.toBytes(HbaseUtils.getStartRowkey(citycode,range.getStartPoint())));
scan.setStopRow(Bytes.toBytes(HbaseUtils.getStopRowkey(citycode,range.getStartPoint(),range.getEndPoint())));
ResultScanner rs = table.getScanner(scan);
Iterator it = rs.iterator();
byte[] f1 = Bytes.toBytes("f1");
byte[] caller = Bytes.toBytes("citycode");
byte[] callee = Bytes.toBytes("so2");
byte[] callTime = Bytes.toBytes("co");
byte[] callDuration = Bytes.toBytes("no2");
while (it.hasNext()) {
Result r = it.next();
Map map = new HashMap();
map.put("rowkey",Bytes.toString(r.getRow()));
map.put("caller",Bytes.toString(r.getValue(f1,citycode)));
map.put("callee",Bytes.toString(r.getValue(f1,so2)));
map.put("callTime",Bytes.toString(r.getValue(f1,co)));
map.put("callDuration",Bytes.toString(r.getValue(f1,no2)));
list.add(map);
}
}
}catch (Exception e){
}
return list;
}
public static String getStartRowkey(String citycode, String time) {
int region=Math.abs((yearMoth+citycode).hashCode())%20;
return region+citycode+time;
}
public static String getStopRowkey(String citycode,String starttime, String endtime) {
int region=Math.abs((yearMoth+citycode).hashCode())%20;
return region+citycode+endtime;
}