Skip to content

Commit 88478c8

Browse files
Merge pull request #458 from ClickHouse/faster-init
Faster initialization
2 parents e1be252 + 8a3c160 commit 88478c8

42 files changed

Lines changed: 126 additions & 84 deletions

File tree

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

cedardb/benchmark.sh

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,9 +6,10 @@ sudo apt-get install -y docker.io postgresql-client gzip
66

77
# download dataset
88
echo "Downloading dataset..."
9-
wget --continue --progress=dot:giga 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
9+
sudo apt-get install -y axel pigz
10+
axel --num-connections=32 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
1011
echo "Unpacking dataset..."
11-
gzip -d hits.tsv.gz
12+
pigz -d -f hits.tsv.gz
1213
mkdir data
1314
mv hits.tsv data
1415
chmod -R 777 data

chdb/benchmark.sh

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -7,8 +7,9 @@ pip install psutil
77
pip install chdb
88

99
# Load the data
10-
wget --continue --progress=dot:giga 'https://datasets.clickhouse.com/hits_compatible/hits.csv.gz'
11-
gzip -d -f hits.csv.gz
10+
sudo apt-get install -y axel pigz
11+
axel --num-connections=32 'https://datasets.clickhouse.com/hits_compatible/hits.csv.gz'
12+
pigz -d -f hits.csv.gz
1213
./load.py
1314

1415
# Run the queries

citus/benchmark.sh

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,9 @@ sudo apt-get install -y postgresql-client
66

77
sudo docker run -d --name citus -p 5432:5432 -e POSTGRES_PASSWORD=mypass citusdata/citus:11.0
88

9-
wget --continue --progress=dot:giga 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
10-
gzip -d -f hits.tsv.gz
9+
sudo apt-get install -y axel pigz
10+
axel --num-connections=32 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
11+
pigz -d -f hits.tsv.gz
1112

1213
echo "*:*:*:*:mypass" > .pgpass
1314
chmod 400 .pgpass

clickhouse-tencent/benchmark.sh

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -19,8 +19,9 @@ clickhouse-client < create.sql
1919

2020
if [ ! -f hits.tsv ]
2121
then
22-
wget --continue --progress=dot:giga 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
23-
gzip -d -f hits.tsv.gz
22+
sudo apt-get install -y axel pigz
23+
axel --num-connections=32 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
24+
pigz -d -f hits.tsv.gz
2425
fi
2526

2627
clickhouse-client --time --query "INSERT INTO hits FORMAT TSV" < hits.tsv

clickhouse/benchmark.sh

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -39,8 +39,9 @@ clickhouse-client < create"$SUFFIX".sql
3939

4040
if [ ! -f hits.tsv ]
4141
then
42-
wget --continue --progress=dot:giga 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
43-
gzip -d -f hits.tsv.gz
42+
sudo apt-get install -y axel pigz
43+
axel --num-connections=32 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
44+
pigz -d -f hits.tsv.gz
4445
fi
4546

4647
echo -n "Load time: "

databend/benchmark.sh

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -26,8 +26,9 @@ CONF
2626
# Docs: https://databend.rs/doc/use-cases/analyze-hits-dataset-with-databend
2727
curl 'http://default@localhost:8124/' --data-binary @create.sql
2828

29-
wget --continue --progress=dot:giga 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
30-
gzip -d hits.tsv.gz
29+
sudo apt-get install -y axel pigz
30+
axel --num-connections=32 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
31+
pigz -d -f hits.tsv.gz
3132

3233
## Aws gp2 write performance is not stable, we must load the data when disk's write around ~500MB/s (Don't know much about the rules of gp2)
3334
time curl -XPUT 'http://root:@127.0.0.1:8000/v1/streaming_load' -H 'insert_sql: insert into hits FILE_FORMAT = (type = TSV)' -F 'upload=@"./hits.tsv"'

doris/benchmark.sh

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -88,8 +88,9 @@ mysql -h 127.0.0.1 -P9030 -uroot hits <"$ROOT"/create.sql
8888

8989
# Download data
9090
if [[ ! -f hits.tsv.gz ]] && [[ ! -f hits.tsv ]]; then
91-
wget --continue --progress=dot:giga 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
92-
gzip -d -f hits.tsv.gz
91+
sudo apt-get install -y axel pigz
92+
axel --num-connections=32 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
93+
pigz -d -f hits.tsv.gz
9394
fi
9495

9596
# Load data

druid/benchmark.sh

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -26,8 +26,9 @@ echo "druid.query.groupBy.maxMergingDictionarySize=5000000000" >> apache-druid-$
2626

2727
# Load the data
2828

29-
wget --continue --progress=dot:giga 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
30-
gzip -d -f hits.tsv.gz
29+
sudo apt-get install -y axel pigz
30+
axel --num-connections=32 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
31+
pigz -d -f hits.tsv.gz
3132

3233
./apache-druid-${VERSION}/bin/post-index-task --file ingest.json --url http://localhost:8081
3334

duckdb-memory/benchmark.sh

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -8,8 +8,9 @@ pip install duckdb==1.1.3 psutil
88

99
# Load the data
1010

11-
wget --continue --progress=dot:giga 'https://datasets.clickhouse.com/hits_compatible/hits.csv.gz'
12-
gzip -d -f hits.csv.gz
11+
sudo apt-get install -y axel pigz
12+
axel --num-connections=32 'https://datasets.clickhouse.com/hits_compatible/hits.csv.gz'
13+
pigz -d -f hits.csv.gz
1314

1415
# Run the queries
1516

duckdb/benchmark.sh

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -14,8 +14,9 @@ export PATH="$PATH:`pwd`/build/release/"
1414
cd ..
1515

1616
# Load the data
17-
wget --continue --progress=dot:giga 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
18-
gzip -d hits.tsv.gz
17+
sudo apt-get install -y axel pigz
18+
axel --num-connections=32 'https://datasets.clickhouse.com/hits_compatible/hits.tsv.gz'
19+
pigz -d -f hits.tsv.gz
1920

2021
time duckdb hits.db -f create.sql -c "COPY hits FROM 'hits.tsv' (QUOTE '')"
2122

0 commit comments

Comments
 (0)