From 16801825bf5d342c02c64b496687dc30f6423120 Mon Sep 17 00:00:00 2001
From: Santo Cariotti
Date: Fri, 14 Feb 2025 23:24:57 +0100
Subject: Auto partitioner

---
 scripts/05-dataproc-submit.sh | 8 +-------
 1 file changed, 1 insertion(+), 7 deletions(-)

(limited to 'scripts/05-dataproc-submit.sh')

diff --git a/scripts/05-dataproc-submit.sh b/scripts/05-dataproc-submit.sh
index 5b2153e..6da9a29 100755
--- a/scripts/05-dataproc-submit.sh
+++ b/scripts/05-dataproc-submit.sh
@@ -6,12 +6,6 @@ if [ ${DEBUG:+1} ]; then
 set -xo pipefail
 fi
 
-if [ "$#" -ne 1 ]; then
- echo "Usage: 'sh ${PWD}/$0 '"
- exit 1
-fi
-
-NUM_PARTITIONS="$1"
 INPUT_PATH="gs://${BUCKET_NAME}/input/"
 OUTPUT_PATH="gs://${BUCKET_NAME}/output"
 
@@ -45,4 +39,4 @@ gcloud dataproc jobs submit spark \
 --jar="gs://${BUCKET_NAME}/scala/co-purchase-analysis_2.12-1.0.jar" \
 --region="${REGION}" \
 --properties="spark.hadoop.fs.gs.impl=com.google.cloud.hadoop.fs.gcs.GoogleHadoopFileSystem" \
- -- "${INPUT_PATH}" "${OUTPUT_PATH}" "${NUM_PARTITIONS}"
+ -- "${INPUT_PATH}" "${OUTPUT_PATH}"
-- 
cgit v1.2.3-18-g5258