Skip to content

Commit

Permalink
Increase example block size to 128 MiB.
Browse files Browse the repository at this point in the history
Signed-off-by: Pascal Spörri <[email protected]>
  • Loading branch information
pspoerri committed Sep 8, 2023
1 parent 7f6db51 commit 8712edc
Show file tree
Hide file tree
Showing 2 changed files with 5 additions and 2 deletions.
3 changes: 2 additions & 1 deletion examples/sql/run_benchmark.sh
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@ SPARK_HADOOP_S3A_CONFIG=(
--conf spark.hadoop.fs.s3a.endpoint=${S3A_ENDPOINT}
--conf spark.hadoop.fs.s3a.path.style.access=true
--conf spark.hadoop.fs.s3a.fast.upload=true
- --conf spark.hadoop.fs.s3a.block.size=$((32*1024*1024))
+ --conf spark.hadoop.fs.s3a.block.size=$((128*1024*1024))
)

SPARK_S3_SHUFFLE_CONFIG=(
Expand Down Expand Up @@ -75,6 +75,7 @@ if (( "$USE_NFS_SHUFFLE" == 1 )); then
--conf spark.shuffle.s3.rootDir=file:///nfs/
--conf spark.kubernetes.executor.podTemplateFile=${SCRIPT_DIR}/../templates/executor_nfs.yml
--conf spark.kubernetes.driver.podTemplateFile=${SCRIPT_DIR}/../templates/driver_nfs.yml
+ --conf spark.hadoop.fs.file.block.size=$((128*1024*1024))
)
fi

Expand Down
4 changes: 3 additions & 1 deletion examples/terasort/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -45,7 +45,7 @@ SPARK_HADOOP_S3A_CONFIG=(
--conf spark.hadoop.fs.s3a.endpoint=${S3A_ENDPOINT}
--conf spark.hadoop.fs.s3a.path.style.access=true
--conf spark.hadoop.fs.s3a.fast.upload=true
- --conf spark.hadoop.fs.s3a.block.size=$((32*1024*1024))
+ --conf spark.hadoop.fs.s3a.block.size=$((128*1024*1024))
)


Expand Down Expand Up @@ -76,6 +76,7 @@ if (( "$USE_NFS_SHUFFLE" == 1 )); then
--conf spark.shuffle.s3.rootDir=file:///nfs/
--conf spark.kubernetes.executor.podTemplateFile=${SCRIPT_DIR}/../templates/executor_nfs.yml
--conf spark.kubernetes.driver.podTemplateFile=${SCRIPT_DIR}/../templates/driver_nfs.yml
+ --conf spark.hadoop.fs.file.block.size=$((128*1024*1024))
)
fi

Expand Down Expand Up @@ -151,3 +152,4 @@ ${SPARK_HOME}/bin/spark-submit \
"s3a://${S3A_OUTPUT_BUCKET}/output/terasort/${SIZE}-${PROCESS_TAG}" "s3a://${S3A_OUTPUT_BUCKET}/output/terasort-validated/${SIZE}-${PROCESS_TAG}"

s3cmd rm -r s3://${S3A_OUTPUT_BUCKET}/output/terasort/${SIZE}-${PROCESS_TAG} || true

0 comments on commit 8712edc

Please sign in to comment.