Apache Phoenix Performance Result :: Thu Sep 25 11:08:38 PDT 2014

Test Suite: STANDARD

Queries by Category



Aggregation

select count(*) from AGGREGATION_TABLE
0.66s V4.1.0-HBASE-0.98.1-HADOOP1
0.58s 4.0-HBASE-0.98.1-HADOOP1

select count(1) from AGGREGATION_TABLE group by HOST
0.67s V4.1.0-HBASE-0.98.1-HADOOP1
0.58s 4.0-HBASE-0.98.1-HADOOP1

select core, count(1) from AGGREGATION_TABLE group by CORE
0.8s V4.1.0-HBASE-0.98.1-HADOOP1
0.76s 4.0-HBASE-0.98.1-HADOOP1

select core, host, sum(ACTIVE_VISITOR) from AGGREGATION_TABLE group by core, host
3.35s V4.1.0-HBASE-0.98.1-HADOOP1
3.25s 4.0-HBASE-0.98.1-HADOOP1

select AVG(DB), MIN(CORE), MAX(ACTIVE_VISITOR) from AGGREGATION_TABLE where host='CS' and DOMAIN<>'Google.com'
3.99s V4.1.0-HBASE-0.98.1-HADOOP1
4.03s 4.0-HBASE-0.98.1-HADOOP1

select round(date, 'day',50), sum(core)+2 from AGGREGATION_TABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
1.35s V4.1.0-HBASE-0.98.1-HADOOP1
1.27s 4.0-HBASE-0.98.1-HADOOP1

select trunc(date, 'hour', 1000), count(DB), count(ACTIVE_VISITOR) from AGGREGATION_TABLE where feature='Login' and (core<50 or db<20 or active_visitor > 200) group by trunc(date, 'hour', 1000)
2.79s V4.1.0-HBASE-0.98.1-HADOOP1
2.66s 4.0-HBASE-0.98.1-HADOOP1

select count(active_visitor) count from AGGREGATION_TABLE
2.94s V4.1.0-HBASE-0.98.1-HADOOP1
2.78s 4.0-HBASE-0.98.1-HADOOP1

select count(distinct active_visitor) count from AGGREGATION_TABLE
3.32s V4.1.0-HBASE-0.98.1-HADOOP1
3.09s 4.0-HBASE-0.98.1-HADOOP1

select count(core), count(db), count(active_visitor) from AGGREGATION_TABLE
3.87s V4.1.0-HBASE-0.98.1-HADOOP1
3.68s 4.0-HBASE-0.98.1-HADOOP1

select core, count(db) count from AGGREGATION_TABLE group by CORE
0.84s V4.1.0-HBASE-0.98.1-HADOOP1
0.74s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from AGGREGATION_TABLE where core < 10 and db < 200
1.34s V4.1.0-HBASE-0.98.1-HADOOP1
1.22s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from AGGREGATION_TABLE where core < 10 and active_visitor < 1000
2.37s V4.1.0-HBASE-0.98.1-HADOOP1
2.19s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from AGGREGATION_TABLE where core > 90
1.19s V4.1.0-HBASE-0.98.1-HADOOP1
1.09s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from WIDE_PK
2.9s V4.1.0-HBASE-0.98.1-HADOOP1
2.65s 4.0-HBASE-0.98.1-HADOOP1


Aggregation with filter on non-pk

select count(*) from TABLE_6CF where f < 10000
3.17s V4.1.0-HBASE-0.98.1-HADOOP1
2.96s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_1CF where f < 10000
2.34s V4.1.0-HBASE-0.98.1-HADOOP1
2.16s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from WIDE_PK where column2<10
3.1s V4.1.0-HBASE-0.98.1-HADOOP1
2.85s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from WIDE_PK where column2<50 and column3<50 and column4<50 and column5<50
3.71s V4.1.0-HBASE-0.98.1-HADOOP1
3.62s 4.0-HBASE-0.98.1-HADOOP1


ColumnFamilies-Single

select count(1) from TABLE_6CF where K1 in ('A', 'B', 'C', 'D')
1.02s V4.1.0-HBASE-0.98.1-HADOOP1
0.94s 4.0-HBASE-0.98.1-HADOOP1

select count(1) from TABLE_6CF where K1 in ('A', 'C')
0.78s V4.1.0-HBASE-0.98.1-HADOOP1
0.75s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_6CF where f < 1000
1.69s V4.1.0-HBASE-0.98.1-HADOOP1
1.6s 4.0-HBASE-0.98.1-HADOOP1

select a,b,c,d,e,f from TABLE_6CF where B>1000 and B<2000 and f>1000 and f<2000
2.58s V4.1.0-HBASE-0.98.1-HADOOP1
2.44s 4.0-HBASE-0.98.1-HADOOP1

select sum(a),sum(b),sum(c),sum(d) from TABLE_6CF group by K1
6.22s V4.1.0-HBASE-0.98.1-HADOOP1
5.95s 4.0-HBASE-0.98.1-HADOOP1

select count(1) from TABLE_1CF where K1 in ('A', 'B', 'C', 'D')
2.34s V4.1.0-HBASE-0.98.1-HADOOP1
2.12s 4.0-HBASE-0.98.1-HADOOP1

select count(1) from TABLE_1CF where K1 in ('A', 'C')
2.04s V4.1.0-HBASE-0.98.1-HADOOP1
1.83s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_1CF where f < 1000
2.5s V4.1.0-HBASE-0.98.1-HADOOP1
2.3s 4.0-HBASE-0.98.1-HADOOP1

select a,b,c,d,e,f from TABLE_1CF where B>1000 and B<2000 and f>1000 and f<2000
3.33s V4.1.0-HBASE-0.98.1-HADOOP1
3.1s 4.0-HBASE-0.98.1-HADOOP1

select sum(a),sum(b),sum(c),sum(d) from TABLE_1CF group by K1
2.68s V4.1.0-HBASE-0.98.1-HADOOP1
2.33s 4.0-HBASE-0.98.1-HADOOP1


Count Distinct

select count(distinct core), count(distinct db), count(distinct active_visitor) from AGGREGATION_TABLE
4.5s V4.1.0-HBASE-0.98.1-HADOOP1
4.35s 4.0-HBASE-0.98.1-HADOOP1

select core, count(distinct db) count from AGGREGATION_TABLE group by CORE
2.07s V4.1.0-HBASE-0.98.1-HADOOP1
1.92s 4.0-HBASE-0.98.1-HADOOP1


IN/LIKE Clause

select count(core) from AGGREGATION_TABLE where core IN (1,25,50,75,100)
1.15s V4.1.0-HBASE-0.98.1-HADOOP1
1.06s 4.0-HBASE-0.98.1-HADOOP1

select count(1) from IN_LIKE_TABLE where K1 in ('Z', 'D', 'F', 'X')
0.88s V4.1.0-HBASE-0.98.1-HADOOP1
0.81s 4.0-HBASE-0.98.1-HADOOP1

select * from IN_LIKE_TABLE where K1 in ('A','B') and K2 in ('xxx1000000','xxx2000000','xxx2000001')
0.01s V4.1.0-HBASE-0.98.1-HADOOP1
0.01s 4.0-HBASE-0.98.1-HADOOP1

select * from IN_LIKE_TABLE where K1 in ('A', 'C', 'E', 'F', 'H') and K2 like 'xxxxxx1%'
0.03s V4.1.0-HBASE-0.98.1-HADOOP1
0.03s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from IN_LIKE_TABLE where K1 in ('X','A','B','C','D','E','F','G','H','I','Z') and K2 like '%1%'
278.34s V4.1.0-HBASE-0.98.1-HADOOP1
132.81s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from IN_LIKE_TABLE where (K1 in ('A','E','F','G','H','I','Z') or K1 like 'E%') and (K2 like '%xx1%' or K2 like '%xxxxxx2%')
125.66s V4.1.0-HBASE-0.98.1-HADOOP1
60.88s 4.0-HBASE-0.98.1-HADOOP1


Index

select count(*) from INDEXED_TABLE
1.02s V4.1.0-HBASE-0.98.1-HADOOP1
0.78s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE idx1 idx2 idx3 idx4) */ count(*) from INDEXED_TABLE
1.21s V4.1.0-HBASE-0.98.1-HADOOP1
1.11s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE ids1 ids2 ids3 ids4) */ count(*) from INDEXED_TABLE
0.4s V4.1.0-HBASE-0.98.1-HADOOP1
0.38s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(*) from INDEXED_TABLE
1.35s V4.1.0-HBASE-0.98.1-HADOOP1
1.16s 4.0-HBASE-0.98.1-HADOOP1

select round(date, 'day',50), sum(core)+2 from INDEXED_TABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
0.61s V4.1.0-HBASE-0.98.1-HADOOP1
0.63s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ round(date, 'day',50), sum(core)+2 from INDEXED_TABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
1.95s V4.1.0-HBASE-0.98.1-HADOOP1
2.05s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core IN (1,100)
0.07s V4.1.0-HBASE-0.98.1-HADOOP1
0.06s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE idx1 idx2 idx3 idx4) */ count(core) from INDEXED_TABLE where core IN (1,100)
0.05s V4.1.0-HBASE-0.98.1-HADOOP1
0.05s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE ids1 ids2 ids3 ids4) */ count(core) from INDEXED_TABLE where core IN (1,100)
0.09s V4.1.0-HBASE-0.98.1-HADOOP1
0.06s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core IN (1,100)
1.65s V4.1.0-HBASE-0.98.1-HADOOP1
1.66s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core IN (1,25,50,75,100)
0.15s V4.1.0-HBASE-0.98.1-HADOOP1
0.11s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE idx1 idx2 idx3 idx4) */ count(core) from INDEXED_TABLE where core IN (1,25,50,75,100)
0.11s V4.1.0-HBASE-0.98.1-HADOOP1
0.13s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE ids1 ids2 ids3 ids4) */ count(core) from INDEXED_TABLE where core IN (1,25,50,75,100)
0.11s V4.1.0-HBASE-0.98.1-HADOOP1
0.11s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core IN (1,25,50,75,100)
1.7s V4.1.0-HBASE-0.98.1-HADOOP1
1.68s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core < 10 and db < 200
0.7s V4.1.0-HBASE-0.98.1-HADOOP1
0.7s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE idx1 idx2 idx3 idx4) */ count(core) from INDEXED_TABLE where core < 10 and db < 200
0.69s V4.1.0-HBASE-0.98.1-HADOOP1
0.7s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE ids1 ids2 ids3 ids4) */ count(core) from INDEXED_TABLE where core < 10 and db < 200
0.22s V4.1.0-HBASE-0.98.1-HADOOP1
0.23s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core < 10 and db < 200
1.97s V4.1.0-HBASE-0.98.1-HADOOP1
1.94s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core < 100 and db < 2000
1.83s V4.1.0-HBASE-0.98.1-HADOOP1
1.42s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core < 100 and db < 2000
2.01s V4.1.0-HBASE-0.98.1-HADOOP1
1.99s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core > 90
0.16s V4.1.0-HBASE-0.98.1-HADOOP1
0.25s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core > 90
1.76s V4.1.0-HBASE-0.98.1-HADOOP1
1.71s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core > 0
1.26s V4.1.0-HBASE-0.98.1-HADOOP1
0.96s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core > 0
1.78s V4.1.0-HBASE-0.98.1-HADOOP1
1.61s 4.0-HBASE-0.98.1-HADOOP1

select db from INDEXED_TABLE where db >5 and db <7 order by db
0.07s V4.1.0-HBASE-0.98.1-HADOOP1
0.06s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ db from INDEXED_TABLE where db >5 and db <7 order by db
3.86s V4.1.0-HBASE-0.98.1-HADOOP1
3.87s 4.0-HBASE-0.98.1-HADOOP1

select db from INDEXED_TABLE order by db limit 10
0.08s V4.1.0-HBASE-0.98.1-HADOOP1
0.08s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ db from INDEXED_TABLE order by db limit 10
2.43s V4.1.0-HBASE-0.98.1-HADOOP1
2.03s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from INDEXED_TABLE_MUTABLE
1.47s V4.1.0-HBASE-0.98.1-HADOOP1
0.89s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE midx1 midx2 midx3 midx4) */ count(*) from INDEXED_TABLE_MUTABLE
1.91s V4.1.0-HBASE-0.98.1-HADOOP1
1.06s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE mids1 mids2 mids3 mids4) */ count(*) from INDEXED_TABLE_MUTABLE
0.68s V4.1.0-HBASE-0.98.1-HADOOP1
0.53s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(*) from INDEXED_TABLE_MUTABLE
0.97s V4.1.0-HBASE-0.98.1-HADOOP1
0.93s 4.0-HBASE-0.98.1-HADOOP1

select round(date, 'day',50), sum(core)+2 from INDEXED_TABLE_MUTABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
0.48s V4.1.0-HBASE-0.98.1-HADOOP1
0.52s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ round(date, 'day',50), sum(core)+2 from INDEXED_TABLE_MUTABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
1.79s V4.1.0-HBASE-0.98.1-HADOOP1
1.72s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core IN (1,100)
0.06s V4.1.0-HBASE-0.98.1-HADOOP1
0.06s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE midx1 midx2 midx3 midx4) */ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,100)
0.05s V4.1.0-HBASE-0.98.1-HADOOP1
0.04s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE mids1 mids2 mids3 mids4) */ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,100)
0.09s V4.1.0-HBASE-0.98.1-HADOOP1
0.36s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,100)
1.38s V4.1.0-HBASE-0.98.1-HADOOP1
1.49s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core IN (1,25,50,75,100)
0.1s V4.1.0-HBASE-0.98.1-HADOOP1
0.1s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE midx1 midx2 midx3 midx4) */ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,25,50,75,100)
0.12s V4.1.0-HBASE-0.98.1-HADOOP1
0.08s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE mids1 mids2 mids3 mids4) */ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,25,50,75,100)
0.09s V4.1.0-HBASE-0.98.1-HADOOP1
0.3s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,25,50,75,100)
1.38s V4.1.0-HBASE-0.98.1-HADOOP1
1.46s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core < 10 and db < 200
0.45s V4.1.0-HBASE-0.98.1-HADOOP1
0.43s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE midx1 midx2 midx3 midx4) */ count(core) from INDEXED_TABLE_MUTABLE where core < 10 and db < 200
0.45s V4.1.0-HBASE-0.98.1-HADOOP1
0.41s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE mids1 mids2 mids3 mids4) */ count(core) from INDEXED_TABLE_MUTABLE where core < 10 and db < 200
0.63s V4.1.0-HBASE-0.98.1-HADOOP1
0.48s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core < 10 and db < 200
1.71s V4.1.0-HBASE-0.98.1-HADOOP1
1.78s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core < 100 and db < 2000
0.99s V4.1.0-HBASE-0.98.1-HADOOP1
0.9s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core < 100 and db < 2000
1.76s V4.1.0-HBASE-0.98.1-HADOOP1
1.75s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core > 90
0.18s V4.1.0-HBASE-0.98.1-HADOOP1
0.22s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core > 90
1.52s V4.1.0-HBASE-0.98.1-HADOOP1
1.54s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core > 0
0.71s V4.1.0-HBASE-0.98.1-HADOOP1
0.61s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core > 0
1.43s V4.1.0-HBASE-0.98.1-HADOOP1
1.31s 4.0-HBASE-0.98.1-HADOOP1

select db from INDEXED_TABLE_MUTABLE where db >5 and db <7 order by db
0.04s V4.1.0-HBASE-0.98.1-HADOOP1
0.04s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ db from INDEXED_TABLE_MUTABLE where db >5 and db <7 order by db
2.92s V4.1.0-HBASE-0.98.1-HADOOP1
3.04s 4.0-HBASE-0.98.1-HADOOP1

select db from INDEXED_TABLE_MUTABLE order by db limit 10
1.47s V4.1.0-HBASE-0.98.1-HADOOP1
1.52s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ db from INDEXED_TABLE_MUTABLE order by db limit 10
1.83s V4.1.0-HBASE-0.98.1-HADOOP1
1.58s 4.0-HBASE-0.98.1-HADOOP1


Index Creation After Data

CREATE INDEX idx5 ON INDEXED_TABLE (CORE) INCLUDE (DB,ACTIVE_VISITOR)
49.33s V4.1.0-HBASE-0.98.1-HADOOP1
49.03s 4.0-HBASE-0.98.1-HADOOP1

CREATE INDEX midx5 ON INDEXED_TABLE_MUTABLE (CORE) INCLUDE (DB,ACTIVE_VISITOR)
43.75s V4.1.0-HBASE-0.98.1-HADOOP1
40.7s 4.0-HBASE-0.98.1-HADOOP1


Large Group By

select count(*) from TABLE_6CF group by A
1.13s V4.1.0-HBASE-0.98.1-HADOOP1
0.98s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_6CF group by B
3.69s V4.1.0-HBASE-0.98.1-HADOOP1
3.48s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_1CF group by A
2.17s V4.1.0-HBASE-0.98.1-HADOOP1
1.9s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_1CF group by B
2.29s V4.1.0-HBASE-0.98.1-HADOOP1
1.99s 4.0-HBASE-0.98.1-HADOOP1


Load Data

LOAD DATA AGGREGATION_TABLE [2000000 ROWS]
139.19s V4.1.0-HBASE-0.98.1-HADOOP1
132.58s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA IN_LIKE_TABLE [2000000 ROWS]
106.37s V4.1.0-HBASE-0.98.1-HADOOP1
110.09s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA INDEXED_TABLE [2000000 ROWS]
482.45s V4.1.0-HBASE-0.98.1-HADOOP1
497.1s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA INDEXED_TABLE_MUTABLE [2000000 ROWS]
683.16s V4.1.0-HBASE-0.98.1-HADOOP1
665.44s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA TABLE_6CF [2000000 ROWS]
126.08s V4.1.0-HBASE-0.98.1-HADOOP1
128.77s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA SALTED_TABLE [2000000 ROWS]
118.87s V4.1.0-HBASE-0.98.1-HADOOP1
119.92s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA TABLE_1CF [2000000 ROWS]
116.01s V4.1.0-HBASE-0.98.1-HADOOP1
117.35s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA WIDE_PK [2000000 ROWS]
340.16s V4.1.0-HBASE-0.98.1-HADOOP1
234.21s 4.0-HBASE-0.98.1-HADOOP1


Percentile

select percentile_cont(0.9) within group (order by active_visitor asc) from AGGREGATION_TABLE
3.24s V4.1.0-HBASE-0.98.1-HADOOP1
3.11s 4.0-HBASE-0.98.1-HADOOP1

select percentile_cont(0.1) within group (order by active_visitor desc) from AGGREGATION_TABLE
3.3s V4.1.0-HBASE-0.98.1-HADOOP1
3.1s 4.0-HBASE-0.98.1-HADOOP1

select percentile_cont(0.5) within group (order by core asc), percentile_cont(0.5) within group (order by db asc), percentile_cont(0.5) within group (order by active_visitor asc) from AGGREGATION_TABLE
4.52s V4.1.0-HBASE-0.98.1-HADOOP1
4.36s 4.0-HBASE-0.98.1-HADOOP1

select core, percentile_cont(0.9999) within group (order by db asc) from AGGREGATION_TABLE group by CORE
2.15s V4.1.0-HBASE-0.98.1-HADOOP1
1.98s 4.0-HBASE-0.98.1-HADOOP1


Reverse Scan

select * from WIDE_PK order by mypk DESC limit 10
0.06s V4.1.0-HBASE-0.98.1-HADOOP1
0.03s 4.0-HBASE-0.98.1-HADOOP1


Salting

select count(1) from SALTED_TABLE where K1 in ('A', 'B', 'C', 'D')
1.15s V4.1.0-HBASE-0.98.1-HADOOP1
1.13s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from SALTED_TABLE where D < 1000
1.32s V4.1.0-HBASE-0.98.1-HADOOP1
1.25s 4.0-HBASE-0.98.1-HADOOP1

select avg(c),avg(d) from SALTED_TABLE group by K1
5.14s V4.1.0-HBASE-0.98.1-HADOOP1
4.75s 4.0-HBASE-0.98.1-HADOOP1




Queries by Table



AGGREGATION_TABLE


Table used for various aggregation functions

ROWS 2000000 [2M]

DDL CREATE TABLE $TABLE (HOST CHAR(2) NOT NULL,DOMAIN VARCHAR NOT NULL,FEATURE VARCHAR NOT NULL,DATE DATE NOT NULL,USAGE.CORE BIGINT,USAGE.DB BIGINT,STATS.ACTIVE_VISITOR INTEGER CONSTRAINT PK PRIMARY KEY (HOST, DOMAIN, FEATURE, DATE)) SPLIT ON ('CSGoogle','CSSalesforce','EUApple','EUGoogle','EUSalesforce','NAApple','NAGoogle','NASalesforce')

DATA GENERATOR
STRING :: Values: NA|CS|EU
STRING :: Values: Salesforce.com|Apple.com|Google.com|Yelp.com
STRING :: Values: Login|Report|Dashboard|Sales|UI
DATE :: Values: SEQUENTIAL
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 2000 Values: RANDOM
INTEGER :: Max. Value: 10000 Values: RANDOM

select count(*) from AGGREGATION_TABLE
0.66s V4.1.0-HBASE-0.98.1-HADOOP1
0.58s 4.0-HBASE-0.98.1-HADOOP1

select count(1) from AGGREGATION_TABLE group by HOST
0.67s V4.1.0-HBASE-0.98.1-HADOOP1
0.58s 4.0-HBASE-0.98.1-HADOOP1

select core, count(1) from AGGREGATION_TABLE group by CORE
0.8s V4.1.0-HBASE-0.98.1-HADOOP1
0.76s 4.0-HBASE-0.98.1-HADOOP1

select core, host, sum(ACTIVE_VISITOR) from AGGREGATION_TABLE group by core, host
3.35s V4.1.0-HBASE-0.98.1-HADOOP1
3.25s 4.0-HBASE-0.98.1-HADOOP1

select AVG(DB), MIN(CORE), MAX(ACTIVE_VISITOR) from AGGREGATION_TABLE where host='CS' and DOMAIN<>'Google.com'
3.99s V4.1.0-HBASE-0.98.1-HADOOP1
4.03s 4.0-HBASE-0.98.1-HADOOP1

select round(date, 'day',50), sum(core)+2 from AGGREGATION_TABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
1.35s V4.1.0-HBASE-0.98.1-HADOOP1
1.27s 4.0-HBASE-0.98.1-HADOOP1

select trunc(date, 'hour', 1000), count(DB), count(ACTIVE_VISITOR) from AGGREGATION_TABLE where feature='Login' and (core<50 or db<20 or active_visitor > 200) group by trunc(date, 'hour', 1000)
2.79s V4.1.0-HBASE-0.98.1-HADOOP1
2.66s 4.0-HBASE-0.98.1-HADOOP1

select count(active_visitor) count from AGGREGATION_TABLE
2.94s V4.1.0-HBASE-0.98.1-HADOOP1
2.78s 4.0-HBASE-0.98.1-HADOOP1

select count(distinct active_visitor) count from AGGREGATION_TABLE
3.32s V4.1.0-HBASE-0.98.1-HADOOP1
3.09s 4.0-HBASE-0.98.1-HADOOP1

select percentile_cont(0.9) within group (order by active_visitor asc) from AGGREGATION_TABLE
3.24s V4.1.0-HBASE-0.98.1-HADOOP1
3.11s 4.0-HBASE-0.98.1-HADOOP1

select percentile_cont(0.1) within group (order by active_visitor desc) from AGGREGATION_TABLE
3.3s V4.1.0-HBASE-0.98.1-HADOOP1
3.1s 4.0-HBASE-0.98.1-HADOOP1

select count(core), count(db), count(active_visitor) from AGGREGATION_TABLE
3.87s V4.1.0-HBASE-0.98.1-HADOOP1
3.68s 4.0-HBASE-0.98.1-HADOOP1

select count(distinct core), count(distinct db), count(distinct active_visitor) from AGGREGATION_TABLE
4.5s V4.1.0-HBASE-0.98.1-HADOOP1
4.35s 4.0-HBASE-0.98.1-HADOOP1

select percentile_cont(0.5) within group (order by core asc), percentile_cont(0.5) within group (order by db asc), percentile_cont(0.5) within group (order by active_visitor asc) from AGGREGATION_TABLE
4.52s V4.1.0-HBASE-0.98.1-HADOOP1
4.36s 4.0-HBASE-0.98.1-HADOOP1

select core, count(db) count from AGGREGATION_TABLE group by CORE
0.84s V4.1.0-HBASE-0.98.1-HADOOP1
0.74s 4.0-HBASE-0.98.1-HADOOP1

select core, count(distinct db) count from AGGREGATION_TABLE group by CORE
2.07s V4.1.0-HBASE-0.98.1-HADOOP1
1.92s 4.0-HBASE-0.98.1-HADOOP1

select core, percentile_cont(0.9999) within group (order by db asc) from AGGREGATION_TABLE group by CORE
2.15s V4.1.0-HBASE-0.98.1-HADOOP1
1.98s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from AGGREGATION_TABLE where core IN (1,25,50,75,100)
1.15s V4.1.0-HBASE-0.98.1-HADOOP1
1.06s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from AGGREGATION_TABLE where core < 10 and db < 200
1.34s V4.1.0-HBASE-0.98.1-HADOOP1
1.22s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from AGGREGATION_TABLE where core < 10 and active_visitor < 1000
2.37s V4.1.0-HBASE-0.98.1-HADOOP1
2.19s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from AGGREGATION_TABLE where core > 90
1.19s V4.1.0-HBASE-0.98.1-HADOOP1
1.09s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA AGGREGATION_TABLE [2000000 ROWS]
139.19s V4.1.0-HBASE-0.98.1-HADOOP1
132.58s 4.0-HBASE-0.98.1-HADOOP1


IN_LIKE_TABLE


Phoenix 1.2+ uses a skip scan, which gives a significant performance improvement for IN/LIKE queries.

ROWS 2000000 [2M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF.A INTEGER, CF.B VARCHAR, CF.C VARCHAR CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D','E','F','G','H','I')

DATA GENERATOR
STRING :: Values: A|B|C|D|E|F|G|H|I
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
STRING :: Length: 50 Values: RANDOM
STRING :: Length: 50 Values: RANDOM

select count(1) from IN_LIKE_TABLE where K1 in ('Z', 'D', 'F', 'X')
0.88s V4.1.0-HBASE-0.98.1-HADOOP1
0.81s 4.0-HBASE-0.98.1-HADOOP1

select * from IN_LIKE_TABLE where K1 in ('A','B') and K2 in ('xxx1000000','xxx2000000','xxx2000001')
0.01s V4.1.0-HBASE-0.98.1-HADOOP1
0.01s 4.0-HBASE-0.98.1-HADOOP1

select * from IN_LIKE_TABLE where K1 in ('A', 'C', 'E', 'F', 'H') and K2 like 'xxxxxx1%'
0.03s V4.1.0-HBASE-0.98.1-HADOOP1
0.03s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from IN_LIKE_TABLE where K1 in ('X','A','B','C','D','E','F','G','H','I','Z') and K2 like '%1%'
278.34s V4.1.0-HBASE-0.98.1-HADOOP1
132.81s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from IN_LIKE_TABLE where (K1 in ('A','E','F','G','H','I','Z') or K1 like 'E%') and (K2 like '%xx1%' or K2 like '%xxxxxx2%')
125.66s V4.1.0-HBASE-0.98.1-HADOOP1
60.88s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA IN_LIKE_TABLE [2000000 ROWS]
106.37s V4.1.0-HBASE-0.98.1-HADOOP1
110.09s 4.0-HBASE-0.98.1-HADOOP1


INDEXED_TABLE


Indexing test (a Phoenix 2.0+ feature). Hover over the version label to view the explain plan, which shows which index table is used.

ROWS 2000000 [2M]

DDL CREATE TABLE $TABLE (HOST CHAR(2) NOT NULL,DOMAIN VARCHAR NOT NULL,FEATURE VARCHAR NOT NULL,DATE DATE NOT NULL,USAGE.CORE BIGINT,USAGE.DB BIGINT,STATS.ACTIVE_VISITOR INTEGER CONSTRAINT PK PRIMARY KEY (HOST, DOMAIN, FEATURE, DATE)) IMMUTABLE_ROWS=true,MAX_FILESIZE=30485760;CREATE INDEX idx1 ON $TABLE (CORE);CREATE INDEX idx2 ON $TABLE (DB);CREATE INDEX idx3 ON $TABLE (DB,ACTIVE_VISITOR);CREATE INDEX idx4 ON $TABLE (CORE,DB,ACTIVE_VISITOR);CREATE INDEX ids1 ON $TABLE (CORE) SALT_BUCKETS=16;CREATE INDEX ids2 ON $TABLE (DB) SALT_BUCKETS=16;CREATE INDEX ids3 ON $TABLE (DB,ACTIVE_VISITOR) SALT_BUCKETS=16;CREATE INDEX ids4 ON $TABLE (CORE,DB,ACTIVE_VISITOR) SALT_BUCKETS=16;

DATA GENERATOR
STRING :: Values: NA|CS|EU
STRING :: Values: Salesforce.com|Apple.com|Google.com|Yelp.com
STRING :: Values: Login|Report|Dashboard|Sales|UI
DATE :: Values: SEQUENTIAL
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 2000 Values: RANDOM
INTEGER :: Max. Value: 10000 Values: RANDOM

select count(*) from INDEXED_TABLE
1.02s V4.1.0-HBASE-0.98.1-HADOOP1
0.78s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE idx1 idx2 idx3 idx4) */ count(*) from INDEXED_TABLE
1.21s V4.1.0-HBASE-0.98.1-HADOOP1
1.11s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE ids1 ids2 ids3 ids4) */ count(*) from INDEXED_TABLE
0.4s V4.1.0-HBASE-0.98.1-HADOOP1
0.38s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(*) from INDEXED_TABLE
1.35s V4.1.0-HBASE-0.98.1-HADOOP1
1.16s 4.0-HBASE-0.98.1-HADOOP1

select round(date, 'day',50), sum(core)+2 from INDEXED_TABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
0.61s V4.1.0-HBASE-0.98.1-HADOOP1
0.63s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ round(date, 'day',50), sum(core)+2 from INDEXED_TABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
1.95s V4.1.0-HBASE-0.98.1-HADOOP1
2.05s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core IN (1,100)
0.07s V4.1.0-HBASE-0.98.1-HADOOP1
0.06s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE idx1 idx2 idx3 idx4) */ count(core) from INDEXED_TABLE where core IN (1,100)
0.05s V4.1.0-HBASE-0.98.1-HADOOP1
0.05s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE ids1 ids2 ids3 ids4) */ count(core) from INDEXED_TABLE where core IN (1,100)
0.09s V4.1.0-HBASE-0.98.1-HADOOP1
0.06s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core IN (1,100)
1.65s V4.1.0-HBASE-0.98.1-HADOOP1
1.66s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core IN (1,25,50,75,100)
0.15s V4.1.0-HBASE-0.98.1-HADOOP1
0.11s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE idx1 idx2 idx3 idx4) */ count(core) from INDEXED_TABLE where core IN (1,25,50,75,100)
0.11s V4.1.0-HBASE-0.98.1-HADOOP1
0.13s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE ids1 ids2 ids3 ids4) */ count(core) from INDEXED_TABLE where core IN (1,25,50,75,100)
0.11s V4.1.0-HBASE-0.98.1-HADOOP1
0.11s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core IN (1,25,50,75,100)
1.7s V4.1.0-HBASE-0.98.1-HADOOP1
1.68s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core < 10 and db < 200
0.7s V4.1.0-HBASE-0.98.1-HADOOP1
0.7s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE idx1 idx2 idx3 idx4) */ count(core) from INDEXED_TABLE where core < 10 and db < 200
0.69s V4.1.0-HBASE-0.98.1-HADOOP1
0.7s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE ids1 ids2 ids3 ids4) */ count(core) from INDEXED_TABLE where core < 10 and db < 200
0.22s V4.1.0-HBASE-0.98.1-HADOOP1
0.23s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core < 10 and db < 200
1.97s V4.1.0-HBASE-0.98.1-HADOOP1
1.94s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core < 100 and db < 2000
1.83s V4.1.0-HBASE-0.98.1-HADOOP1
1.42s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core < 100 and db < 2000
2.01s V4.1.0-HBASE-0.98.1-HADOOP1
1.99s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core > 90
0.16s V4.1.0-HBASE-0.98.1-HADOOP1
0.25s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core > 90
1.76s V4.1.0-HBASE-0.98.1-HADOOP1
1.71s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE where core > 0
1.26s V4.1.0-HBASE-0.98.1-HADOOP1
0.96s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE where core > 0
1.78s V4.1.0-HBASE-0.98.1-HADOOP1
1.61s 4.0-HBASE-0.98.1-HADOOP1

select db from INDEXED_TABLE where db >5 and db <7 order by db
0.07s V4.1.0-HBASE-0.98.1-HADOOP1
0.06s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ db from INDEXED_TABLE where db >5 and db <7 order by db
3.86s V4.1.0-HBASE-0.98.1-HADOOP1
3.87s 4.0-HBASE-0.98.1-HADOOP1

select db from INDEXED_TABLE order by db limit 10
0.08s V4.1.0-HBASE-0.98.1-HADOOP1
0.08s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ db from INDEXED_TABLE order by db limit 10
2.43s V4.1.0-HBASE-0.98.1-HADOOP1
2.03s 4.0-HBASE-0.98.1-HADOOP1

CREATE INDEX idx5 ON INDEXED_TABLE (CORE) INCLUDE (DB,ACTIVE_VISITOR)
49.33s V4.1.0-HBASE-0.98.1-HADOOP1
49.03s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA INDEXED_TABLE [2000000 ROWS]
482.45s V4.1.0-HBASE-0.98.1-HADOOP1
497.1s 4.0-HBASE-0.98.1-HADOOP1


INDEXED_TABLE_MUTABLE


Indexing test (a Phoenix 2.0+ feature). Hover over the version label to view the explain plan, which shows which index table is used.

ROWS 2000000 [2M]

DDL CREATE TABLE $TABLE (HOST CHAR(2) NOT NULL,DOMAIN VARCHAR NOT NULL,FEATURE VARCHAR NOT NULL,DATE DATE NOT NULL,USAGE.CORE BIGINT,USAGE.DB BIGINT,STATS.ACTIVE_VISITOR INTEGER CONSTRAINT PK PRIMARY KEY (HOST, DOMAIN, FEATURE, DATE)) MAX_FILESIZE=30485760;CREATE INDEX midx1 ON $TABLE (CORE);CREATE INDEX midx2 ON $TABLE (DB);CREATE INDEX midx3 ON $TABLE (DB,ACTIVE_VISITOR);CREATE INDEX midx4 ON $TABLE (CORE,DB,ACTIVE_VISITOR);CREATE INDEX mids1 ON $TABLE (CORE) SALT_BUCKETS=16;CREATE INDEX mids2 ON $TABLE (DB) SALT_BUCKETS=16;CREATE INDEX mids3 ON $TABLE (DB,ACTIVE_VISITOR) SALT_BUCKETS=16;CREATE INDEX mids4 ON $TABLE (CORE,DB,ACTIVE_VISITOR) SALT_BUCKETS=16;

DATA GENERATOR
STRING :: Values: NA|CS|EU
STRING :: Values: Salesforce.com|Apple.com|Google.com|Yelp.com
STRING :: Values: Login|Report|Dashboard|Sales|UI
DATE :: Values: SEQUENTIAL
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 2000 Values: RANDOM
INTEGER :: Max. Value: 10000 Values: RANDOM

select count(*) from INDEXED_TABLE_MUTABLE
1.47s V4.1.0-HBASE-0.98.1-HADOOP1
0.89s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE midx1 midx2 midx3 midx4) */ count(*) from INDEXED_TABLE_MUTABLE
1.91s V4.1.0-HBASE-0.98.1-HADOOP1
1.06s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE mids1 mids2 mids3 mids4) */ count(*) from INDEXED_TABLE_MUTABLE
0.68s V4.1.0-HBASE-0.98.1-HADOOP1
0.53s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(*) from INDEXED_TABLE_MUTABLE
0.97s V4.1.0-HBASE-0.98.1-HADOOP1
0.93s 4.0-HBASE-0.98.1-HADOOP1

select round(date, 'day',50), sum(core)+2 from INDEXED_TABLE_MUTABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
0.48s V4.1.0-HBASE-0.98.1-HADOOP1
0.52s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ round(date, 'day',50), sum(core)+2 from INDEXED_TABLE_MUTABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
1.79s V4.1.0-HBASE-0.98.1-HADOOP1
1.72s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core IN (1,100)
0.06s V4.1.0-HBASE-0.98.1-HADOOP1
0.06s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE midx1 midx2 midx3 midx4) */ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,100)
0.05s V4.1.0-HBASE-0.98.1-HADOOP1
0.04s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE mids1 mids2 mids3 mids4) */ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,100)
0.09s V4.1.0-HBASE-0.98.1-HADOOP1
0.36s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,100)
1.38s V4.1.0-HBASE-0.98.1-HADOOP1
1.49s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core IN (1,25,50,75,100)
0.1s V4.1.0-HBASE-0.98.1-HADOOP1
0.1s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE midx1 midx2 midx3 midx4) */ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,25,50,75,100)
0.12s V4.1.0-HBASE-0.98.1-HADOOP1
0.08s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE mids1 mids2 mids3 mids4) */ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,25,50,75,100)
0.09s V4.1.0-HBASE-0.98.1-HADOOP1
0.3s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core IN (1,25,50,75,100)
1.38s V4.1.0-HBASE-0.98.1-HADOOP1
1.46s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core < 10 and db < 200
0.45s V4.1.0-HBASE-0.98.1-HADOOP1
0.43s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE midx1 midx2 midx3 midx4) */ count(core) from INDEXED_TABLE_MUTABLE where core < 10 and db < 200
0.45s V4.1.0-HBASE-0.98.1-HADOOP1
0.41s 4.0-HBASE-0.98.1-HADOOP1

select /*+ INDEX(INDEXED_TABLE_MUTABLE mids1 mids2 mids3 mids4) */ count(core) from INDEXED_TABLE_MUTABLE where core < 10 and db < 200
0.63s V4.1.0-HBASE-0.98.1-HADOOP1
0.48s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core < 10 and db < 200
1.71s V4.1.0-HBASE-0.98.1-HADOOP1
1.78s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core < 100 and db < 2000
0.99s V4.1.0-HBASE-0.98.1-HADOOP1
0.9s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core < 100 and db < 2000
1.76s V4.1.0-HBASE-0.98.1-HADOOP1
1.75s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core > 90
0.18s V4.1.0-HBASE-0.98.1-HADOOP1
0.22s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core > 90
1.52s V4.1.0-HBASE-0.98.1-HADOOP1
1.54s 4.0-HBASE-0.98.1-HADOOP1

select count(core) from INDEXED_TABLE_MUTABLE where core > 0
0.71s V4.1.0-HBASE-0.98.1-HADOOP1
0.61s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ count(core) from INDEXED_TABLE_MUTABLE where core > 0
1.43s V4.1.0-HBASE-0.98.1-HADOOP1
1.31s 4.0-HBASE-0.98.1-HADOOP1

select db from INDEXED_TABLE_MUTABLE where db >5 and db <7 order by db
0.04s V4.1.0-HBASE-0.98.1-HADOOP1
0.04s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ db from INDEXED_TABLE_MUTABLE where db >5 and db <7 order by db
2.92s V4.1.0-HBASE-0.98.1-HADOOP1
3.04s 4.0-HBASE-0.98.1-HADOOP1

select db from INDEXED_TABLE_MUTABLE order by db limit 10
1.47s V4.1.0-HBASE-0.98.1-HADOOP1
1.52s 4.0-HBASE-0.98.1-HADOOP1

select /*+NO_INDEX*/ db from INDEXED_TABLE_MUTABLE order by db limit 10
1.83s V4.1.0-HBASE-0.98.1-HADOOP1
1.58s 4.0-HBASE-0.98.1-HADOOP1

CREATE INDEX midx5 ON INDEXED_TABLE_MUTABLE (CORE) INCLUDE (DB,ACTIVE_VISITOR)
43.75s V4.1.0-HBASE-0.98.1-HADOOP1
40.7s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA INDEXED_TABLE_MUTABLE [2000000 ROWS]
683.16s V4.1.0-HBASE-0.98.1-HADOOP1
665.44s 4.0-HBASE-0.98.1-HADOOP1


TABLE_6CF


Data is split across 6 column families. Phoenix 1.2+ uses the Essential Column Family filter feature, which fetches only the required columns when filtering rows.

ROWS 2000000 [2M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF1.A INTEGER, CF2.B INTEGER, CF3.C INTEGER, CF4.D INTEGER, CF5.E INTEGER, CF6.F INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D');CREATE TABLE IF NOT EXISTS $TABLE_UPSERTSELECT (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF1.A INTEGER, CF2.B INTEGER, CF3.C INTEGER, CF4.D INTEGER, CF5.E INTEGER, CF6.F INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D')

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 1000 Values: RANDOM
INTEGER :: Max. Value: 2000 Values: RANDOM
INTEGER :: Max. Value: 5000 Values: RANDOM
INTEGER :: Max. Value: 10000 Values: RANDOM
INTEGER :: Max. Value: 15000 Values: RANDOM

select count(1) from TABLE_6CF where K1 in ('A', 'B', 'C', 'D')
1.02s V4.1.0-HBASE-0.98.1-HADOOP1
0.94s 4.0-HBASE-0.98.1-HADOOP1

select count(1) from TABLE_6CF where K1 in ('A', 'C')
0.78s V4.1.0-HBASE-0.98.1-HADOOP1
0.75s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_6CF where f < 1000
1.69s V4.1.0-HBASE-0.98.1-HADOOP1
1.6s 4.0-HBASE-0.98.1-HADOOP1

select a,b,c,d,e,f from TABLE_6CF where B>1000 and B<2000 and f>1000 and f<2000
2.58s V4.1.0-HBASE-0.98.1-HADOOP1
2.44s 4.0-HBASE-0.98.1-HADOOP1

select sum(a),sum(b),sum(c),sum(d) from TABLE_6CF group by K1
6.22s V4.1.0-HBASE-0.98.1-HADOOP1
5.95s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_6CF group by A
1.13s V4.1.0-HBASE-0.98.1-HADOOP1
0.98s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_6CF group by B
3.69s V4.1.0-HBASE-0.98.1-HADOOP1
3.48s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_6CF where f < 10000
3.17s V4.1.0-HBASE-0.98.1-HADOOP1
2.96s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA TABLE_6CF [2000000 ROWS]
126.08s V4.1.0-HBASE-0.98.1-HADOOP1
128.77s 4.0-HBASE-0.98.1-HADOOP1


SALTED_TABLE


This is a Phoenix 1.2+ feature. Data is split into 4 regions, equal to the number of region servers in the test cluster, by adding a salt byte to each key.

ROWS 2000000 [2M]

DDL CREATE TABLE $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CFA.A VARCHAR, CFA.B CHAR(100), CFA.C INTEGER, CFB.D INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SALT_BUCKETS=4

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
STRING :: Length: 100 Values: RANDOM
STRING :: Length: 100 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

select count(1) from SALTED_TABLE where K1 in ('A', 'B', 'C', 'D')
1.15s V4.1.0-HBASE-0.98.1-HADOOP1
1.13s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from SALTED_TABLE where D < 1000
1.32s V4.1.0-HBASE-0.98.1-HADOOP1
1.25s 4.0-HBASE-0.98.1-HADOOP1

select avg(c),avg(d) from SALTED_TABLE group by K1
5.14s V4.1.0-HBASE-0.98.1-HADOOP1
4.75s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA SALTED_TABLE [2000000 ROWS]
118.87s V4.1.0-HBASE-0.98.1-HADOOP1
119.92s 4.0-HBASE-0.98.1-HADOOP1


TABLE_1CF


Same data as in the 6-column-family table, but this one has only a single column family. Performance should be worse in most cases.

ROWS 2000000 [2M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF.A INTEGER, CF.B INTEGER, CF.C INTEGER, CF.D INTEGER, CF.E INTEGER, CF.F INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D');CREATE TABLE IF NOT EXISTS $TABLE_UPSERTSELECT (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF.A INTEGER, CF.B INTEGER, CF.C INTEGER, CF.D INTEGER, CF.E INTEGER, CF.F INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D')

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 1000 Values: RANDOM
INTEGER :: Max. Value: 2000 Values: RANDOM
INTEGER :: Max. Value: 5000 Values: RANDOM
INTEGER :: Max. Value: 10000 Values: RANDOM
INTEGER :: Max. Value: 15000 Values: RANDOM

select count(1) from TABLE_1CF where K1 in ('A', 'B', 'C', 'D')
2.34s V4.1.0-HBASE-0.98.1-HADOOP1
2.12s 4.0-HBASE-0.98.1-HADOOP1

select count(1) from TABLE_1CF where K1 in ('A', 'C')
2.04s V4.1.0-HBASE-0.98.1-HADOOP1
1.83s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_1CF where f < 1000
2.5s V4.1.0-HBASE-0.98.1-HADOOP1
2.3s 4.0-HBASE-0.98.1-HADOOP1

select a,b,c,d,e,f from TABLE_1CF where B>1000 and B<2000 and f>1000 and f<2000
3.33s V4.1.0-HBASE-0.98.1-HADOOP1
3.1s 4.0-HBASE-0.98.1-HADOOP1

select sum(a),sum(b),sum(c),sum(d) from TABLE_1CF group by K1
2.68s V4.1.0-HBASE-0.98.1-HADOOP1
2.33s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_1CF group by A
2.17s V4.1.0-HBASE-0.98.1-HADOOP1
1.9s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_1CF group by B
2.29s V4.1.0-HBASE-0.98.1-HADOOP1
1.99s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from TABLE_1CF where f < 10000
2.34s V4.1.0-HBASE-0.98.1-HADOOP1
2.16s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA TABLE_1CF [2000000 ROWS]
116.01s V4.1.0-HBASE-0.98.1-HADOOP1
117.35s 4.0-HBASE-0.98.1-HADOOP1


WIDE_PK




ROWS 2000000 [2M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (mypk CHAR(500) NOT NULL PRIMARY KEY,CF.column1 INTEGER,CF.column2 INTEGER,CF.column3 INTEGER,CF.column4 INTEGER,CF.column5 INTEGER) SALT_BUCKETS=4;

DATA GENERATOR
STRING :: Length: 500 Values: SEQUENTIAL
INTEGER :: Values: SEQUENTIAL
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 100 Values: RANDOM

select count(*) from WIDE_PK
2.9s V4.1.0-HBASE-0.98.1-HADOOP1
2.65s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from WIDE_PK where column2<10
3.1s V4.1.0-HBASE-0.98.1-HADOOP1
2.85s 4.0-HBASE-0.98.1-HADOOP1

select * from WIDE_PK order by mypk DESC limit 10
0.06s V4.1.0-HBASE-0.98.1-HADOOP1
0.03s 4.0-HBASE-0.98.1-HADOOP1

select count(*) from WIDE_PK where column2<50 and column3<50 and column4<50 and column5<50
3.71s V4.1.0-HBASE-0.98.1-HADOOP1
3.62s 4.0-HBASE-0.98.1-HADOOP1

LOAD DATA WIDE_PK [2000000 ROWS]
340.16s V4.1.0-HBASE-0.98.1-HADOOP1
234.21s 4.0-HBASE-0.98.1-HADOOP1



Note: Hover over a version label to see the Phoenix query explain plan.