Phoenix Performance Result :: Thu Jun 06 21:38:52 PDT 2013

AGGREGATION_TABLE
Various server-side grouped and ungrouped aggregation functions. Data is pre-split into 9 regions over a 4-region-server cluster.

ROWS 10000000 [10M]

DDL CREATE TABLE $TABLE (HOST CHAR(2) NOT NULL,DOMAIN VARCHAR NOT NULL,FEATURE VARCHAR NOT NULL,DATE DATE NOT NULL,USAGE.CORE BIGINT,USAGE.DB BIGINT,STATS.ACTIVE_VISITOR INTEGER CONSTRAINT PK PRIMARY KEY (HOST, DOMAIN, FEATURE, DATE)) SPLIT ON ('CSGoogle','CSSalesforce','EUApple','EUGoogle','EUSalesforce','NAApple','NAGoogle','NASalesforce')

DATA GENERATOR
STRING :: Values: NA|CS|EU
STRING :: Values: Salesforce.com|Apple.com|Google.com|Yelp.com
STRING :: Values: Login|Report|Dashboard|Sales|UI
DATE :: Values: SEQUENTIAL
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 2000 Values: RANDOM
INTEGER :: Max. Value: 10000 Values: RANDOM

QUERIES
select trunc(date, 'hour', 1000), count(DB), count(ACTIVE_VISITOR) from AGGREGATION_TABLE where feature='Login' and (core<50 or db<20 or active_visitor > 200) group by trunc(date, 'hour', 1000)
8.31s SNAPSHOT
8.82s PHOENIX-1.2.0
12.97s PHOENIX-1.1

select round(date, 'day',50), sum(core)+2 from AGGREGATION_TABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
6.4s SNAPSHOT
6.72s PHOENIX-1.2.0
6.76s PHOENIX-1.1

select count(1) from AGGREGATION_TABLE group by HOST
9.03s SNAPSHOT
9.14s PHOENIX-1.2.0
9.04s PHOENIX-1.1

select count(*) from AGGREGATION_TABLE
8.59s SNAPSHOT
8.67s PHOENIX-1.2.0
8.75s PHOENIX-1.1

select core, host, sum(ACTIVE_VISITOR) from AGGREGATION_TABLE group by core, host
14.87s SNAPSHOT
15.57s PHOENIX-1.2.0
15.43s PHOENIX-1.1

select core, count(1) from AGGREGATION_TABLE group by CORE
9.23s SNAPSHOT
9.47s PHOENIX-1.2.0
9.35s PHOENIX-1.1

select MIN(CORE) from AGGREGATION_TABLE group by DOMAIN
9.46s SNAPSHOT
9.7s PHOENIX-1.2.0
9.46s PHOENIX-1.1

select AVG(DB), MIN(CORE), MAX(ACTIVE_VISITOR) from AGGREGATION_TABLE where host='CS' and DOMAIN<>'Google.com'
18.38s SNAPSHOT
16.82s PHOENIX-1.2.0
16.44s PHOENIX-1.1

LOAD DATA [10000000 ROWS]
363.13s SNAPSHOT
359.93s PHOENIX-1.2.0
295.74s PHOENIX-1.1


IN_LIKE_TABLE
Phoenix 1.2+ uses a skip scan, which gives a significant performance improvement for IN/LIKE queries.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF.A INTEGER, CF.B VARCHAR, CF.C VARCHAR CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D','E','F','G','H','I')

DATA GENERATOR
STRING :: Values: A|B|C|D|E|F|G|H|I
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
STRING :: Length: 50 Values: RANDOM
STRING :: Length: 50 Values: RANDOM

QUERIES
select count(1) from IN_LIKE_TABLE where K1 in ('Z', 'D', 'F', 'X')
3.66s SNAPSHOT
3.64s PHOENIX-1.2.0
3.88s PHOENIX-1.1

select count(*) from IN_LIKE_TABLE where K1 in ('X','A','B','C','D','E','F','G','H','I','Z') and K2 like '%1%'
5.7s SNAPSHOT
5.28s PHOENIX-1.2.0
4.91s PHOENIX-1.1

select count(*) from IN_LIKE_TABLE where (K1 in ('A','E','F','G','H','I','Z') or K1 like 'E%') and (K2 like '%xx1%' or K2 like '%xxxxxx2%')
5.62s SNAPSHOT
5.27s PHOENIX-1.2.0
4.98s PHOENIX-1.1

select * from IN_LIKE_TABLE where K1 in ('A','B') and K2 in ('xxx1000000','xxx2000000','xxx2000001')
0.01s SNAPSHOT
0.01s PHOENIX-1.2.0
5.99s PHOENIX-1.1

select * from IN_LIKE_TABLE where K1 in ('A', 'C', 'E', 'F', 'H') and K2 like 'xxxxxx1%'
0.02s SNAPSHOT
0.02s PHOENIX-1.2.0
25.45s PHOENIX-1.1

LOAD DATA [10000000 ROWS]
313.97s SNAPSHOT
313.19s PHOENIX-1.2.0
244.2s PHOENIX-1.1


CF_TABLE_14CF
Data is split across 14 column families. Phoenix 1.2+ uses the Essential Column Family filter feature, which fetches only required columns when filtering rows.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF1.A INTEGER, CF2.B INTEGER, CF3.C INTEGER, CF4.D INTEGER, CF5.E INTEGER, CF6.F INTEGER, CF7.G INTEGER, CF8.H INTEGER, CF9.I INTEGER, CF10.J INTEGER, CF11.K INTEGER, CF12.L INTEGER, CF13.M INTEGER, CF14.N INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D')

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select sum(a),sum(e),sum(j),sum(n) from CF_TABLE_14CF group by K1
37.93s SNAPSHOT
36.95s PHOENIX-1.2.0
35.35s PHOENIX-1.1

select count(1) from CF_TABLE_14CF where K1 in ('A', 'B', 'C', 'D')
12.39s SNAPSHOT
12.16s PHOENIX-1.2.0
12.4s PHOENIX-1.1

select count(*) from CF_TABLE_14CF where N < 1000
6.04s SNAPSHOT
6.17s PHOENIX-1.2.0
17.92s PHOENIX-1.1

select a,b,c,d,e,f,g,h,i,j,k,l,m,n from CF_TABLE_14CF where (B>1000 and B<2000) and (M>1000 and M<2000)
8.06s SNAPSHOT
8.26s PHOENIX-1.2.0
458.29s PHOENIX-1.1

LOAD DATA [10000000 ROWS]
650.11s SNAPSHOT
638.98s PHOENIX-1.2.0
478.73s PHOENIX-1.1


SALTED_TABLE
This is a Phoenix 1.2+ feature. Data is split into 4 regions, equal to the number of region servers in the test cluster, by adding a salt byte to each key.

ROWS 10000000 [10M]

DDL CREATE TABLE $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CFA.A VARCHAR, CFA.B CHAR(100), CFA.C INTEGER, CFB.D INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SALT_BUCKETS=4

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
STRING :: Length: 100 Values: RANDOM
STRING :: Length: 100 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select count(1) from SALTED_TABLE where K1 in ('A', 'B', 'C', 'D')
7.05s SNAPSHOT
7.37s PHOENIX-1.2.0
21.49s PHOENIX-1.1

select count(*) from SALTED_TABLE where D < 1000
2.8s SNAPSHOT
2.74s PHOENIX-1.2.0
24.07s PHOENIX-1.1

select avg(c),avg(d) from SALTED_TABLE group by K1
15.32s SNAPSHOT
14.87s PHOENIX-1.2.0
27.57s PHOENIX-1.1

LOAD DATA [10000000 ROWS]
390.27s SNAPSHOT
386.94s PHOENIX-1.2.0
408.57s PHOENIX-1.1


CF_TABLE_1CF
Same data as in the 14-column-family table, but this one has only a single column family. Performance should be worse than the 14-column-family table in most cases.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF.A INTEGER, CF.B INTEGER, CF.C INTEGER, CF.D INTEGER, CF.E INTEGER, CF.F INTEGER, CF.G INTEGER, CF.H INTEGER, CF.I INTEGER, CF.J INTEGER, CF.K INTEGER, CF.L INTEGER, CF.M INTEGER, CF.N INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D')

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select sum(a),sum(e),sum(j),sum(n) from CF_TABLE_1CF group by K1
33.32s SNAPSHOT
33.73s PHOENIX-1.2.0
32.64s PHOENIX-1.1

select count(1) from CF_TABLE_1CF where K1 in ('A', 'B', 'C', 'D')
10.34s SNAPSHOT
11.01s PHOENIX-1.2.0
10.29s PHOENIX-1.1

select count(*) from CF_TABLE_1CF where N < 1000
14.67s SNAPSHOT
14.99s PHOENIX-1.2.0
14.58s PHOENIX-1.1

select a,b,c,d,e,f,g,h,i,j,k,l,m,n from CF_TABLE_1CF where B>1000 and B<2000 and M>1000 and M<2000
17.2s SNAPSHOT
17.38s PHOENIX-1.2.0
76.32s PHOENIX-1.1

LOAD DATA [10000000 ROWS]
565.34s SNAPSHOT
545.73s PHOENIX-1.2.0
400.5s PHOENIX-1.1