[root@cdh4 scripts]# parquet-tools meta hdfs://cdh3.macro.com:8020/user/hive/warehouse/iot_test.db/hive_table_parquet/subdir=10/000000_0
creator: parquet-mr version 1.5.0-cdh5.13.1 (build ${buildNumber})
file schema: hive_schema
并发测试脚本准备
脚本
# Impala load-balancer address: cdh4.macro.com:25003
[root@cdh4 scripts]# cat impala-test.sh
#!/bin/sh
# Concurrency test: run the same SQL file through several impala-shell
# sessions in parallel and wait for all of them to finish.
#
# Usage: impala-test.sh <concurrency> <sql-file>
#   $1 - number of impala-shell sessions to start in the background
#   $2 - SQL file handed to impala-shell via -f
# Session i writes its result to log/<i>.out.

if [ "$#" -lt 2 ]; then
  echo "Usage: $0 <concurrency> <sql-file>" >&2
  exit 2
fi

# Make sure the directory used for the -o output files exists.
mkdir -p log || exit 1

i=1
while [ "$i" -le "$1" ]; do
  impala-shell -B -i cdh4.macro.com:25003 -u hive -f "$2" -o "log/${i}.out" &
  # POSIX arithmetic expansion; `let` is not available in every /bin/sh.
  i=$((i + 1))
done

# Block until every background session has exited.
wait
SQL测试
-- Per-day totals of GPRSUSEDFLOW and SMSUSEDFLOW for CUSTID '10099'
-- (rows with subdir = '10') over the seven days before today.
-- Subquery B lists those seven dates; the RIGHT JOIN keeps one output row
-- per date, and nvl() turns the missing totals of empty days into 0.
SELECT
  nvl(A.TOTALGPRSUSEDFLOW, 0) AS TOTALGPRSUSEDFLOW,
  nvl(A.TOTALSMSUSEDFLOW, 0) AS TOTALSMSUSEDFLOW,
  B.USEDDATE AS USEDDATE
FROM (
  SELECT
    SUM(GPRSUSEDFLOW) AS TOTALGPRSUSEDFLOW,
    SUM(SMSUSEDFLOW) AS TOTALSMSUSEDFLOW,
    cast(STATSDATE as timestamp) AS USEDDATE
  FROM hive_table_parquet SIMFLOW
  WHERE SIMFLOW.subdir = '10'
    AND SIMFLOW.CUSTID = '10099'
    AND cast(SIMFLOW.STATSDATE as timestamp) >= to_date(date_sub(current_timestamp(), 7))
    -- NOTE(review): the original text was cut off after the cast below; the
    -- upper bound, the GROUP BY and the "A" alias are reconstructed from the
    -- outer query (which references A.*) and from the date list in B.
    -- Confirm the intended upper bound.
    AND cast(SIMFLOW.STATSDATE as timestamp) < to_date(current_timestamp())
  GROUP BY cast(STATSDATE as timestamp)
) A
RIGHT JOIN (
  SELECT to_date(date_sub(current_timestamp(), 7)) AS USEDDATE
  UNION ALL
  SELECT to_date(date_sub(current_timestamp(), 1)) AS USEDDATE
  UNION ALL
  SELECT to_date(date_sub(current_timestamp(), 2)) AS USEDDATE
  UNION ALL
  SELECT to_date(date_sub(current_timestamp(), 3)) AS USEDDATE
  UNION ALL
  SELECT to_date(date_sub(current_timestamp(), 4)) AS USEDDATE
  UNION ALL
  SELECT to_date(date_sub(current_timestamp(), 5)) AS USEDDATE
  UNION ALL
  SELECT to_date(date_sub(current_timestamp(), 6)) AS USEDDATE
) B ON to_date(A.USEDDATE) = to_date(B.USEDDATE)
ORDER BY B.USEDDATE;