Phoenix Performance Result :: Thu Jul 11 22:05:30 PDT 2013

AGGREGATION_TEST_TABLE
Various server-side grouped and ungrouped aggregation functions. Data is pre-split into 9 regions over a cluster of 4 region servers.

ROWS 10000000 [10M]

DDL CREATE TABLE $TABLE (HOST CHAR(2) NOT NULL,DOMAIN VARCHAR NOT NULL,FEATURE VARCHAR NOT NULL,DATE DATE NOT NULL,USAGE.CORE BIGINT,USAGE.DB BIGINT,STATS.ACTIVE_VISITOR INTEGER CONSTRAINT PK PRIMARY KEY (HOST, DOMAIN, FEATURE, DATE)) SPLIT ON ('CSGoogle','CSSalesforce','EUApple','EUGoogle','EUSalesforce','NAApple','NAGoogle','NASalesforce')

DATA GENERATOR
STRING :: Values: NA|CS|EU
STRING :: Values: Salesforce.com|Apple.com|Google.com|Yelp.com
STRING :: Values: Login|Report|Dashboard|Sales|UI
DATE :: Values: SEQUENTIAL
INTEGER :: Max. Value: 100 Values: RANDOM
INTEGER :: Max. Value: 2000 Values: RANDOM
INTEGER :: Max. Value: 10000 Values: RANDOM

QUERIES
select count(*) from AGGREGATION_TEST_TABLE
6.83s CURRENT-SNAPSHOT
7.5s LAST-SNAPSHOT
7.16s PHOENIX-1.1
6.81s PHOENIX-1.2.0

select count(1) from AGGREGATION_TEST_TABLE group by HOST
7.3s CURRENT-SNAPSHOT
7.7s LAST-SNAPSHOT
7.28s PHOENIX-1.1
7.37s PHOENIX-1.2.0

select MIN(CORE) from AGGREGATION_TEST_TABLE group by DOMAIN
7.88s CURRENT-SNAPSHOT
8.59s LAST-SNAPSHOT
8.22s PHOENIX-1.1
8.33s PHOENIX-1.2.0

select core, count(1) from AGGREGATION_TEST_TABLE group by CORE
7.73s CURRENT-SNAPSHOT
8.13s LAST-SNAPSHOT
8.1s PHOENIX-1.1
8.12s PHOENIX-1.2.0

select core, host, sum(ACTIVE_VISITOR) from AGGREGATION_TEST_TABLE group by core, host
12.74s CURRENT-SNAPSHOT
13.29s LAST-SNAPSHOT
13.32s PHOENIX-1.1
13.04s PHOENIX-1.2.0

select AVG(DB), MIN(CORE), MAX(ACTIVE_VISITOR) from AGGREGATION_TEST_TABLE where host='CS' and DOMAIN<>'Google.com'
16.08s CURRENT-SNAPSHOT
18.29s LAST-SNAPSHOT
16s PHOENIX-1.1
17.74s PHOENIX-1.2.0

select round(date, 'day',50), sum(core)+2 from AGGREGATION_TEST_TABLE where (CORE<10 or CORE>90) group by round(date, 'day',50), host
5.46s CURRENT-SNAPSHOT
6.11s LAST-SNAPSHOT
5.48s PHOENIX-1.1
5.57s PHOENIX-1.2.0

select trunc(date, 'hour', 1000), count(DB), count(ACTIVE_VISITOR) from AGGREGATION_TEST_TABLE where feature='Login' and (core<50 or db<20 or active_visitor > 200) group by trunc(date, 'hour', 1000)
7.44s CURRENT-SNAPSHOT
8.03s LAST-SNAPSHOT
11.12s PHOENIX-1.1
7.61s PHOENIX-1.2.0

select count(active_visitor) count from AGGREGATION_TEST_TABLE
11.14s CURRENT-SNAPSHOT
11.98s LAST-SNAPSHOT
11.46s PHOENIX-1.1
11.5s PHOENIX-1.2.0

select count(distinct active_visitor) count from AGGREGATION_TEST_TABLE
12.58s CURRENT-SNAPSHOT
13.14s LAST-SNAPSHOT
N/A for PHOENIX-1.1
N/A for PHOENIX-1.2.0

select percentile_cont(0.9) within group (order by active_visitor asc) from AGGREGATION_TEST_TABLE
12.58s CURRENT-SNAPSHOT
13.19s LAST-SNAPSHOT
N/A for PHOENIX-1.1
N/A for PHOENIX-1.2.0

select percentile_cont(0.1) within group (order by active_visitor desc) from AGGREGATION_TEST_TABLE
12.5s CURRENT-SNAPSHOT
13.18s LAST-SNAPSHOT
N/A for PHOENIX-1.1
N/A for PHOENIX-1.2.0

select count(core), count(db), count(active_visitor) from AGGREGATION_TEST_TABLE
15.49s CURRENT-SNAPSHOT
16.5s LAST-SNAPSHOT
15.65s PHOENIX-1.1
15.72s PHOENIX-1.2.0

select count(distinct core), count(distinct db), count(distinct active_visitor) from AGGREGATION_TEST_TABLE
18.24s CURRENT-SNAPSHOT
18.85s LAST-SNAPSHOT
N/A for PHOENIX-1.1
N/A for PHOENIX-1.2.0

select percentile_cont(0.5) within group (order by core asc), percentile_cont(0.5) within group (order by db asc), percentile_cont(0.5) within group (order by active_visitor asc) from AGGREGATION_TEST_TABLE
18.22s CURRENT-SNAPSHOT
18.68s LAST-SNAPSHOT
N/A for PHOENIX-1.1
N/A for PHOENIX-1.2.0

select core, count(db) count from AGGREGATION_TEST_TABLE group by CORE
11.79s CURRENT-SNAPSHOT
12.16s LAST-SNAPSHOT
11.61s PHOENIX-1.1
11.88s PHOENIX-1.2.0

select core, count(distinct db) count from AGGREGATION_TEST_TABLE group by CORE
14.63s CURRENT-SNAPSHOT
15.2s LAST-SNAPSHOT
N/A for PHOENIX-1.1
N/A for PHOENIX-1.2.0

select core, percentile_cont(0.9999) within group (order by db asc) from AGGREGATION_TEST_TABLE group by CORE
14.78s CURRENT-SNAPSHOT
15.21s LAST-SNAPSHOT
N/A for PHOENIX-1.1
N/A for PHOENIX-1.2.0

LOAD DATA [10000000 ROWS]
319.76s CURRENT-SNAPSHOT
318.9s LAST-SNAPSHOT
293.01s PHOENIX-1.1
370.39s PHOENIX-1.2.0


IN_LIKE_TABLE
Phoenix 1.2+ uses a skip scan, which gives a significant performance improvement for IN/LIKE queries.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF.A INTEGER, CF.B VARCHAR, CF.C VARCHAR CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D','E','F','G','H','I')

DATA GENERATOR
STRING :: Values: A|B|C|D|E|F|G|H|I
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
STRING :: Length: 50 Values: RANDOM
STRING :: Length: 50 Values: RANDOM

QUERIES
select count(1) from IN_LIKE_TABLE where K1 in ('Z', 'D', 'F', 'X')
3.44s CURRENT-SNAPSHOT
3.56s LAST-SNAPSHOT
3.7s PHOENIX-1.1
3.57s PHOENIX-1.2.0

select * from IN_LIKE_TABLE where K1 in ('A','B') and K2 in ('xxx1000000','xxx2000000','xxx2000001')
0.01s CURRENT-SNAPSHOT
0.01s LAST-SNAPSHOT
5.67s PHOENIX-1.1
0.01s PHOENIX-1.2.0

select * from IN_LIKE_TABLE where K1 in ('A', 'C', 'E', 'F', 'H') and K2 like 'xxxxxx1%'
0.01s CURRENT-SNAPSHOT
0.01s LAST-SNAPSHOT
24.57s PHOENIX-1.1
0.02s PHOENIX-1.2.0

select count(*) from IN_LIKE_TABLE where K1 in ('X','A','B','C','D','E','F','G','H','I','Z') and K2 like '%1%'
5.49s CURRENT-SNAPSHOT
5.29s LAST-SNAPSHOT
4.92s PHOENIX-1.1
5.53s PHOENIX-1.2.0

select count(*) from IN_LIKE_TABLE where (K1 in ('A','E','F','G','H','I','Z') or K1 like 'E%') and (K2 like '%xx1%' or K2 like '%xxxxxx2%')
5.26s CURRENT-SNAPSHOT
4.99s LAST-SNAPSHOT
5.05s PHOENIX-1.1
5.48s PHOENIX-1.2.0

LOAD DATA [10000000 ROWS]
253.65s CURRENT-SNAPSHOT
273.24s LAST-SNAPSHOT
233.34s PHOENIX-1.1
318.13s PHOENIX-1.2.0


CF_TABLE_14CF
Data is split across 14 column families. Phoenix 1.2+ uses the Essential Column Family filter feature, which fetches only the required columns when filtering rows.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF1.A INTEGER, CF2.B INTEGER, CF3.C INTEGER, CF4.D INTEGER, CF5.E INTEGER, CF6.F INTEGER, CF7.G INTEGER, CF8.H INTEGER, CF9.I INTEGER, CF10.J INTEGER, CF11.K INTEGER, CF12.L INTEGER, CF13.M INTEGER, CF14.N INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D')

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select count(1) from CF_TABLE_14CF where K1 in ('A', 'B', 'C', 'D')
8.46s CURRENT-SNAPSHOT
8.19s LAST-SNAPSHOT
9.53s PHOENIX-1.1
8.46s PHOENIX-1.2.0

select count(1) from CF_TABLE_14CF where K1 in ('A', 'C')
8.48s CURRENT-SNAPSHOT
8.18s LAST-SNAPSHOT
9.52s PHOENIX-1.1
8.06s PHOENIX-1.2.0

select count(*) from CF_TABLE_14CF where N < 1000
4.18s CURRENT-SNAPSHOT
4.1s LAST-SNAPSHOT
13.93s PHOENIX-1.1
4.1s PHOENIX-1.2.0

select a,b,c,d,e,f,g,h,i,j,k,l,m,n from CF_TABLE_14CF where (B>1000 and B<2000) and (M>1000 and M<2000)
5.94s CURRENT-SNAPSHOT
5.96s LAST-SNAPSHOT
350.07s PHOENIX-1.1
6.01s PHOENIX-1.2.0

select sum(a),sum(e),sum(j),sum(n) from CF_TABLE_14CF group by K1
25.95s CURRENT-SNAPSHOT
25.94s LAST-SNAPSHOT
27.11s PHOENIX-1.1
25.84s PHOENIX-1.2.0

LOAD DATA [10000000 ROWS]
511.12s CURRENT-SNAPSHOT
555.12s LAST-SNAPSHOT
463.65s PHOENIX-1.1
666.43s PHOENIX-1.2.0


SALTED_TABLE
This is a Phoenix 1.2+ feature. Data is split into 4 regions, equal to the number of region servers in the test cluster, by adding a salt byte to each key.

ROWS 10000000 [10M]

DDL CREATE TABLE $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CFA.A VARCHAR, CFA.B CHAR(100), CFA.C INTEGER, CFB.D INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SALT_BUCKETS=4

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
STRING :: Length: 100 Values: RANDOM
STRING :: Length: 100 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select count(1) from SALTED_TABLE where K1 in ('A', 'B', 'C', 'D')
5.81s CURRENT-SNAPSHOT
5.8s LAST-SNAPSHOT
20.43s PHOENIX-1.1
6.74s PHOENIX-1.2.0

select count(*) from SALTED_TABLE where D < 1000
2.2s CURRENT-SNAPSHOT
2.15s LAST-SNAPSHOT
24.37s PHOENIX-1.1
2.19s PHOENIX-1.2.0

select avg(c),avg(d) from SALTED_TABLE group by K1
12.14s CURRENT-SNAPSHOT
12.25s LAST-SNAPSHOT
34.55s PHOENIX-1.1
12.38s PHOENIX-1.2.0

LOAD DATA [10000000 ROWS]
326.7s CURRENT-SNAPSHOT
351.11s LAST-SNAPSHOT
438.89s PHOENIX-1.1
397.12s PHOENIX-1.2.0


CF_TABLE_1CF
Same data as in the 14-column-family table, but this one has only a single column family. Performance should be worse in most cases.

ROWS 10000000 [10M]

DDL CREATE TABLE IF NOT EXISTS $TABLE (K1 CHAR(1) NOT NULL, K2 VARCHAR NOT NULL, CF.A INTEGER, CF.B INTEGER, CF.C INTEGER, CF.D INTEGER, CF.E INTEGER, CF.F INTEGER, CF.G INTEGER, CF.H INTEGER, CF.I INTEGER, CF.J INTEGER, CF.K INTEGER, CF.L INTEGER, CF.M INTEGER, CF.N INTEGER CONSTRAINT PK PRIMARY KEY (K1,K2)) SPLIT ON ('B','C','D')

DATA GENERATOR
STRING :: Values: A|B|C|D
STRING :: Length: 10 Values: SEQUENTIAL
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM
INTEGER :: Max. Value: 1000000 Values: RANDOM

QUERIES
select count(1) from CF_TABLE_1CF where K1 in ('A', 'B', 'C', 'D')
8.67s CURRENT-SNAPSHOT
9s LAST-SNAPSHOT
8.88s PHOENIX-1.1
8.71s PHOENIX-1.2.0

select count(1) from CF_TABLE_1CF where K1 in ('A', 'C')
8.06s CURRENT-SNAPSHOT
8.55s LAST-SNAPSHOT
8.45s PHOENIX-1.1
8.75s PHOENIX-1.2.0

select count(*) from CF_TABLE_1CF where N < 1000
11.48s CURRENT-SNAPSHOT
11.89s LAST-SNAPSHOT
11.11s PHOENIX-1.1
12.08s PHOENIX-1.2.0

select a,b,c,d,e,f,g,h,i,j,k,l,m,n from CF_TABLE_1CF where B>1000 and B<2000 and M>1000 and M<2000
13.69s CURRENT-SNAPSHOT
13.75s LAST-SNAPSHOT
62.04s PHOENIX-1.1
14.86s PHOENIX-1.2.0

select sum(a),sum(e),sum(j),sum(n) from CF_TABLE_1CF group by K1
25.38s CURRENT-SNAPSHOT
25.37s LAST-SNAPSHOT
24.98s PHOENIX-1.1
26.9s PHOENIX-1.2.0

LOAD DATA [10000000 ROWS]
437.16s CURRENT-SNAPSHOT
479.68s LAST-SNAPSHOT
390.17s PHOENIX-1.1
565.81s PHOENIX-1.2.0