Phoenix Performance Result :: Mon Jun 03 16:48:56 PDT 2013

AGGREGATION_TABLE
Various server-side grouped and ungrouped aggregation functions. Data is pre-split into 9 regions across a cluster of 4 region servers.

ROWS 10000000 [10M]

DDL CREATE TABLE $TABLE (HOST CHAR(2) NOT NULL,DOMAIN VARCHAR NOT NULL,FEATURE VARCHAR NOT NULL,DATE DATE NOT NULL,USAGE.CORE BIGINT,USAGE.DB BIGINT,STATS.ACTIVE_VISITOR INTEGER CONSTRAINT PK PRIMARY KEY (HOST, DOMAIN, FEATURE, DATE)) SPLIT ON ('CSGoogle','CSSalesforce','EUApple','EUGoogle','EUSalesforce','NAApple','NAGoogle','NASalesforce')

DATA GENERATOR
STRING :: Values: NA|CS|EU
STRING :: Values: Salesforce.com|Apple.com|Google.com|Yelp.com
STRING :: Values: Login|Report|Dashboard|Sales|UI
DATE :: Values: SEQUENTIAL
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 2000 Values: RANDOM
INTEGER :: Max. Value: 10000 Values: RANDOM

QUERIES
select trunc(date, 'hour', 1000), count(DB), count(ACTIVE_VISITOR) from AGGREGATION_TABLE where feature='Login' and (core<50 or db<20 or active_visitor > 200) group by trunc(date, 'hour', 1000)
7.63s SNAPSHOT
8.85s PHOENIX-1.2.0
11.12s PHOENIX-1.1

select round(date, 'day',50), sum(core)+2 from AGGREGATION_TABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
5.65s SNAPSHOT
6.62s PHOENIX-1.2.0
5.45s PHOENIX-1.1

select count(1) from AGGREGATION_TABLE group by HOST
7.43s SNAPSHOT
8.68s PHOENIX-1.2.0
7.26s PHOENIX-1.1

select count(*) from AGGREGATION_TABLE
7.24s SNAPSHOT
8.42s PHOENIX-1.2.0
6.89s PHOENIX-1.1

select core, host, sum(ACTIVE_VISITOR) from AGGREGATION_TABLE group by core, host
13.22s SNAPSHOT
15.56s PHOENIX-1.2.0
13.14s PHOENIX-1.1

select core, count(1) from AGGREGATION_TABLE group by CORE
8.01s SNAPSHOT
9.44s PHOENIX-1.2.0
8.05s PHOENIX-1.1

select MIN(CORE) from AGGREGATION_TABLE group by DOMAIN
8.12s SNAPSHOT
9.53s PHOENIX-1.2.0
8.14s PHOENIX-1.1

select AVG(DB), MIN(CORE), MAX(ACTIVE_VISITOR) from AGGREGATION_TABLE where host='CS' and DOMAIN<>'Google.com'
16.62s SNAPSHOT
16.7s PHOENIX-1.2.0
17.79s PHOENIX-1.1

LOAD DATA [10000000 ROWS]
361.95s SNAPSHOT
369.66s PHOENIX-1.2.0
284.25s PHOENIX-1.1


IN_LIKE_TABLE
Phoenix 1.2+ uses a skip scan, which gives a significant performance improvement for IN/LIKE queries.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF.A INTEGER, CF.B VARCHAR, CF.C VARCHAR CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D','E','F','G','H','I')

DATA GENERATOR
STRING :: Values: A|B|C|D|E|F|G|H|I
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
STRING :: Length: 50 Values: RANDOM
STRING :: Length: 50 Values: RANDOM

QUERIES
select count(1) from IN_LIKE_TABLE where K1 in ('Z', 'D', 'F', 'X')
3.71s SNAPSHOT
3.83s PHOENIX-1.2.0
3.82s PHOENIX-1.1

select count(*) from IN_LIKE_TABLE where K1 in ('X','A','B','C','D','E','F','G','H','I','Z') and K2 like '%1%'
5.07s SNAPSHOT
5.38s PHOENIX-1.2.0
4.71s PHOENIX-1.1

select count(*) from IN_LIKE_TABLE where (K1 in ('A','E','F','G','H','I','Z') or K1 like 'E%') and (K2 like '%xx1%' or K2 like '%xxxxxx2%')
5.2s SNAPSHOT
5.23s PHOENIX-1.2.0
4.85s PHOENIX-1.1

select * from IN_LIKE_TABLE where K1 in ('A','B') and K2 in ('xxx1000000','xxx2000000','xxx2000001')
0.01s SNAPSHOT
0.01s PHOENIX-1.2.0
5.82s PHOENIX-1.1

select * from IN_LIKE_TABLE where K1 in ('A', 'C', 'E', 'F', 'H') and K2 like 'xxxxxx1%'
0.02s SNAPSHOT
0.02s PHOENIX-1.2.0
25.2s PHOENIX-1.1

LOAD DATA [10000000 ROWS]
317.19s SNAPSHOT
312.94s PHOENIX-1.2.0
239.73s PHOENIX-1.1


CF_TABLE_14CF
Data is split across 14 column families. Phoenix 1.2+ uses the Essential Column Family filter feature, which fetches only the required columns when filtering rows.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF1.A INTEGER, CF2.B INTEGER, CF3.C INTEGER, CF4.D INTEGER, CF5.E INTEGER, CF6.F INTEGER, CF7.G INTEGER, CF8.H INTEGER, CF9.I INTEGER, CF10.J INTEGER, CF11.K INTEGER, CF12.L INTEGER, CF13.M INTEGER, CF14.N INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D')

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select sum(a),sum(e),sum(j),sum(n) from CF_TABLE_14CF group by K1
35.78s SNAPSHOT
36.01s PHOENIX-1.2.0
33.65s PHOENIX-1.1

select count(1) from CF_TABLE_14CF where K1 in ('A', 'B', 'C', 'D')
11.79s SNAPSHOT
11.99s PHOENIX-1.2.0
11.54s PHOENIX-1.1

select count(*) from CF_TABLE_14CF where N < 1000
5.75s SNAPSHOT
5.92s PHOENIX-1.2.0
17.08s PHOENIX-1.1

select a,b,c,d,e,f,g,h,i,j,k,l,m,n from CF_TABLE_14CF where (B>1000 and B<2000) and (M>1000 and M<2000)
7.72s SNAPSHOT
7.96s PHOENIX-1.2.0
440.95s PHOENIX-1.1

LOAD DATA [10000000 ROWS]
642.75s SNAPSHOT
647.87s PHOENIX-1.2.0
471.45s PHOENIX-1.1


SALTED_TABLE
This is a Phoenix 1.2+ feature. Data is split into 4 regions, equal to the number of region servers in the test cluster, by adding a salt byte to each key.

ROWS 10000000 [10M]

DDL CREATE TABLE $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CFA.A VARCHAR, CFA.B CHAR(100), CFA.C INTEGER, CFB.D INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SALT_BUCKETS=4

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
STRING :: Length: 100 Values: RANDOM
STRING :: Length: 100 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select count(1) from SALTED_TABLE where K1 in ('A', 'B', 'C', 'D')
6.88s SNAPSHOT
7.41s PHOENIX-1.2.0
10.32s PHOENIX-1.1

select count(*) from SALTED_TABLE where D < 1000
2.66s SNAPSHOT
2.77s PHOENIX-1.2.0
14.31s PHOENIX-1.1

select avg(c),avg(d) from SALTED_TABLE group by K1
14.57s SNAPSHOT
14.7s PHOENIX-1.2.0
20.88s PHOENIX-1.1

LOAD DATA [10000000 ROWS]
387.64s SNAPSHOT
391.71s PHOENIX-1.2.0
384.16s PHOENIX-1.1


CF_TABLE_1CF
Same data as in the 14-column-family table, but this table has only a single column family. Performance should be worse than with the 14-column-family table in most cases.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF.A INTEGER, CF.B INTEGER, CF.C INTEGER, CF.D INTEGER, CF.E INTEGER, CF.F INTEGER, CF.G INTEGER, CF.H INTEGER, CF.I INTEGER, CF.J INTEGER, CF.K INTEGER, CF.L INTEGER, CF.M INTEGER, CF.N INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D')

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select sum(a),sum(e),sum(j),sum(n) from CF_TABLE_1CF group by K1
32.5s SNAPSHOT
31.75s PHOENIX-1.2.0
31.49s PHOENIX-1.1

select count(1) from CF_TABLE_1CF where K1 in ('A', 'B', 'C', 'D')
10.2s SNAPSHOT
10.06s PHOENIX-1.2.0
10.29s PHOENIX-1.1

select count(*) from CF_TABLE_1CF where N < 1000
14.36s SNAPSHOT
14.02s PHOENIX-1.2.0
13.85s PHOENIX-1.1

select a,b,c,d,e,f,g,h,i,j,k,l,m,n from CF_TABLE_1CF where B>1000 and B<2000 and M>1000 and M<2000
16.52s SNAPSHOT
16.32s PHOENIX-1.2.0
72.19s PHOENIX-1.1

LOAD DATA [10000000 ROWS]
555.22s SNAPSHOT
556.14s PHOENIX-1.2.0
407.06s PHOENIX-1.1