Phoenix Performance Result :: Fri Jul 12 05:37:51 PDT 2013

AGGREGATION_TEST_TABLE
Various server-side grouped and ungrouped aggregation functions. Data is pre-split into 9 regions across a cluster of 4 region servers.

ROWS 10000000 [10M]

DDL CREATE TABLE $TABLE (HOST CHAR(2) NOT NULL,DOMAIN VARCHAR NOT NULL,FEATURE VARCHAR NOT NULL,DATE DATE NOT NULL,USAGE.CORE BIGINT,USAGE.DB BIGINT,STATS.ACTIVE_VISITOR INTEGER CONSTRAINT PK PRIMARY KEY (HOST, DOMAIN, FEATURE, DATE)) SPLIT ON ('CSGoogle','CSSalesforce','EUApple','EUGoogle','EUSalesforce','NAApple','NAGoogle','NASalesforce')

DATA GENERATOR
STRING :: Values: NA|CS|EU
STRING :: Values: Salesforce.com|Apple.com|Google.com|Yelp.com
STRING :: Values: Login|Report|Dashboard|Sales|UI
DATE :: Values: SEQUENTIAL
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 2000 Values: RANDOM
INTEGER :: Max. Value: 10000 Values: RANDOM

QUERIES
select count(*) from AGGREGATION_TEST_TABLE
7.36s CURRENT-SNAPSHOT
7.41s LAST-SNAPSHOT
7.48s PHOENIX-1.2.0

select count(1) from AGGREGATION_TEST_TABLE group by HOST
7.51s CURRENT-SNAPSHOT
7.6s LAST-SNAPSHOT
7.78s PHOENIX-1.2.0

select MIN(CORE) from AGGREGATION_TEST_TABLE group by DOMAIN
8.57s CURRENT-SNAPSHOT
8.42s LAST-SNAPSHOT
8.4s PHOENIX-1.2.0

select core, count(1) from AGGREGATION_TEST_TABLE group by CORE
8.31s CURRENT-SNAPSHOT
8.13s LAST-SNAPSHOT
8.36s PHOENIX-1.2.0

select core, host, sum(ACTIVE_VISITOR) from AGGREGATION_TEST_TABLE group by core, host
13.46s CURRENT-SNAPSHOT
13.5s LAST-SNAPSHOT
13.42s PHOENIX-1.2.0

select AVG(DB), MIN(CORE), MAX(ACTIVE_VISITOR) from AGGREGATION_TEST_TABLE where host='CS' and DOMAIN<>'Google.com'
17.17s CURRENT-SNAPSHOT
17.88s LAST-SNAPSHOT
18.12s PHOENIX-1.2.0

select round(date, 'day',50), sum(core)+2 from AGGREGATION_TEST_TABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
5.77s CURRENT-SNAPSHOT
6s LAST-SNAPSHOT
5.76s PHOENIX-1.2.0

select trunc(date, 'hour', 1000), count(DB), count(ACTIVE_VISITOR) from AGGREGATION_TEST_TABLE where feature='Login' and (core<50 or db<20 or active_visitor > 200) group by trunc(date, 'hour', 1000)
7.57s CURRENT-SNAPSHOT
7.99s LAST-SNAPSHOT
8.17s PHOENIX-1.2.0

select count(active_visitor) count from AGGREGATION_TEST_TABLE
11.99s CURRENT-SNAPSHOT
11.98s LAST-SNAPSHOT
12.18s PHOENIX-1.2.0

select count(distinct active_visitor) count from AGGREGATION_TEST_TABLE
13.34s CURRENT-SNAPSHOT
13.02s LAST-SNAPSHOT
N/A for PHOENIX-1.2.0

select percentile_cont(0.9) within group (order by active_visitor asc) from AGGREGATION_TEST_TABLE
13.23s CURRENT-SNAPSHOT
13.04s LAST-SNAPSHOT
N/A for PHOENIX-1.2.0

select percentile_cont(0.1) within group (order by active_visitor desc) from AGGREGATION_TEST_TABLE
13.24s CURRENT-SNAPSHOT
13.08s LAST-SNAPSHOT
N/A for PHOENIX-1.2.0

select count(core), count(db), count(active_visitor) from AGGREGATION_TEST_TABLE
16.47s CURRENT-SNAPSHOT
16.45s LAST-SNAPSHOT
16.76s PHOENIX-1.2.0

select count(distinct core), count(distinct db), count(distinct active_visitor) from AGGREGATION_TEST_TABLE
18.92s CURRENT-SNAPSHOT
18.64s LAST-SNAPSHOT
N/A for PHOENIX-1.2.0

select percentile_cont(0.5) within group (order by core asc), percentile_cont(0.5) within group (order by db asc), percentile_cont(0.5) within group (order by active_visitor asc) from AGGREGATION_TEST_TABLE
19.04s CURRENT-SNAPSHOT
18.64s LAST-SNAPSHOT
N/A for PHOENIX-1.2.0

select core, count(db) count from AGGREGATION_TEST_TABLE group by CORE
12.18s CURRENT-SNAPSHOT
12.03s LAST-SNAPSHOT
12.39s PHOENIX-1.2.0

select core, count(distinct db) count from AGGREGATION_TEST_TABLE group by CORE
15.29s CURRENT-SNAPSHOT
15.01s LAST-SNAPSHOT
N/A for PHOENIX-1.2.0

select core, percentile_cont(0.9999) within group (order by db asc) from AGGREGATION_TEST_TABLE group by CORE
15.34s CURRENT-SNAPSHOT
15.02s LAST-SNAPSHOT
N/A for PHOENIX-1.2.0

LOAD DATA [10000000 ROWS]
315.23s CURRENT-SNAPSHOT
312.52s LAST-SNAPSHOT
361.82s PHOENIX-1.2.0


IN_LIKE_TABLE
Phoenix 1.2+ uses a skip scan, which gives a significant performance improvement for IN/LIKE queries.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF.A INTEGER, CF.B VARCHAR, CF.C VARCHAR CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D','E','F','G','H','I')

DATA GENERATOR
STRING :: Values: A|B|C|D|E|F|G|H|I
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
STRING :: Length: 50 Values: RANDOM
STRING :: Length: 50 Values: RANDOM

QUERIES
select count(1) from IN_LIKE_TABLE where K1 in ('Z', 'D', 'F', 'X')
3.38s CURRENT-SNAPSHOT
3.59s LAST-SNAPSHOT
3.68s PHOENIX-1.2.0

select * from IN_LIKE_TABLE where K1 in ('A','B') and K2 in ('xxx1000000','xxx2000000','xxx2000001')
0.01s CURRENT-SNAPSHOT
0.01s LAST-SNAPSHOT
0.01s PHOENIX-1.2.0

select * from IN_LIKE_TABLE where K1 in ('A', 'C', 'E', 'F', 'H') and K2 like 'xxxxxx1%'
0.01s CURRENT-SNAPSHOT
0.01s LAST-SNAPSHOT
0.03s PHOENIX-1.2.0

select count(*) from IN_LIKE_TABLE where K1 in ('X','A','B','C','D','E','F','G','H','I','Z') and K2 like '%1%'
5.22s CURRENT-SNAPSHOT
5.65s LAST-SNAPSHOT
5.29s PHOENIX-1.2.0

select count(*) from IN_LIKE_TABLE where (K1 in ('A','E','F','G','H','I','Z') or K1 like 'E%') and (K2 like '%xx1%' or K2 like '%xxxxxx2%')
4.95s CURRENT-SNAPSHOT
5.37s LAST-SNAPSHOT
5.25s PHOENIX-1.2.0

LOAD DATA [10000000 ROWS]
266.15s CURRENT-SNAPSHOT
257.08s LAST-SNAPSHOT
314.9s PHOENIX-1.2.0


CF_TABLE_14CF
Data is split across 14 column families. Phoenix 1.2+ uses the Essential Column Family filter feature, which fetches only the required columns when filtering rows.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF1.A INTEGER, CF2.B INTEGER, CF3.C INTEGER, CF4.D INTEGER, CF5.E INTEGER, CF6.F INTEGER, CF7.G INTEGER, CF8.H INTEGER, CF9.I INTEGER, CF10.J INTEGER, CF11.K INTEGER, CF12.L INTEGER, CF13.M INTEGER, CF14.N INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D')

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select count(1) from CF_TABLE_14CF where K1 in ('A', 'B', 'C', 'D')
8.64s CURRENT-SNAPSHOT
8.54s LAST-SNAPSHOT
8.81s PHOENIX-1.2.0

select count(1) from CF_TABLE_14CF where K1 in ('A', 'C')
7.83s CURRENT-SNAPSHOT
8.5s LAST-SNAPSHOT
8.86s PHOENIX-1.2.0

select count(*) from CF_TABLE_14CF where N < 1000
4.27s CURRENT-SNAPSHOT
4.56s LAST-SNAPSHOT
4.46s PHOENIX-1.2.0

select a,b,c,d,e,f,g,h,i,j,k,l,m,n from CF_TABLE_14CF where (B>1000 and B<2000) and (M>1000 and M<2000)
6.28s CURRENT-SNAPSHOT
6.38s LAST-SNAPSHOT
6.22s PHOENIX-1.2.0

select sum(a),sum(e),sum(j),sum(n) from CF_TABLE_14CF group by K1
26.55s CURRENT-SNAPSHOT
26.34s LAST-SNAPSHOT
26.01s PHOENIX-1.2.0

LOAD DATA [10000000 ROWS]
517.85s CURRENT-SNAPSHOT
512.7s LAST-SNAPSHOT
646.86s PHOENIX-1.2.0


SALTED_TABLE
This is a Phoenix 1.2+ feature. Data is split into 4 regions, equal to the number of region servers in the test cluster, by adding a salt byte to each key.

ROWS 10000000 [10M]

DDL CREATE TABLE $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CFA.A VARCHAR, CFA.B CHAR(100), CFA.C INTEGER, CFB.D INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SALT_BUCKETS=4

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
STRING :: Length: 100 Values: RANDOM
STRING :: Length: 100 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select count(1) from SALTED_TABLE where K1 in ('A', 'B', 'C', 'D')
5.76s CURRENT-SNAPSHOT
6.1s LAST-SNAPSHOT
5.96s PHOENIX-1.2.0

select count(*) from SALTED_TABLE where D < 1000
2.2s CURRENT-SNAPSHOT
2.37s LAST-SNAPSHOT
2.34s PHOENIX-1.2.0

select avg(c),avg(d) from SALTED_TABLE group by K1
12.65s CURRENT-SNAPSHOT
12.25s LAST-SNAPSHOT
12.36s PHOENIX-1.2.0

LOAD DATA [10000000 ROWS]
336.44s CURRENT-SNAPSHOT
325.47s LAST-SNAPSHOT
385.41s PHOENIX-1.2.0


CF_TABLE_1CF
Same data as in the 14-column-family table, but this one has only a single column family. Performance should be worse in most cases.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF.A INTEGER, CF.B INTEGER, CF.C INTEGER, CF.D INTEGER, CF.E INTEGER, CF.F INTEGER, CF.G INTEGER, CF.H INTEGER, CF.I INTEGER, CF.J INTEGER, CF.K INTEGER, CF.L INTEGER, CF.M INTEGER, CF.N INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D')

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select count(1) from CF_TABLE_1CF where K1 in ('A', 'B', 'C', 'D')
9s CURRENT-SNAPSHOT
8.57s LAST-SNAPSHOT
8.97s PHOENIX-1.2.0

select count(1) from CF_TABLE_1CF where K1 in ('A', 'C')
8.31s CURRENT-SNAPSHOT
8.39s LAST-SNAPSHOT
8.86s PHOENIX-1.2.0

select count(*) from CF_TABLE_1CF where N < 1000
12.23s CURRENT-SNAPSHOT
11.61s LAST-SNAPSHOT
12.41s PHOENIX-1.2.0

select a,b,c,d,e,f,g,h,i,j,k,l,m,n from CF_TABLE_1CF where B>1000 and B<2000 and M>1000 and M<2000
14.4s CURRENT-SNAPSHOT
13.94s LAST-SNAPSHOT
14.31s PHOENIX-1.2.0

select sum(a),sum(e),sum(j),sum(n) from CF_TABLE_1CF group by K1
26.77s CURRENT-SNAPSHOT
24.21s LAST-SNAPSHOT
26.57s PHOENIX-1.2.0

LOAD DATA [10000000 ROWS]
443.44s CURRENT-SNAPSHOT
435.08s LAST-SNAPSHOT
555.9s PHOENIX-1.2.0