Skip to content

Commit 292c674

Browse files
committed
Params for Flink parallelism
1 parent afabd4e commit 292c674

File tree

4 files changed

+40
-21
lines changed

4 files changed

+40
-21
lines changed

Diff for: performance-tests/scaling/config.sh.tmpl

+1
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,7 @@ export FHIR_UPLOADER_CORES=8
77
export ENABLE_UPLOAD=false
88
export ENABLE_DOWNLOAD=true
99
export JDBC_MODE=false
10+
# DirectRunner, FlinkRunner or DataflowRunner
1011
export FHIR_ETL_RUNNER=DataflowRunner
1112

1213
# pipeline-scaling-1, pipeline-scaling-2, pipeline-scaling-belgium

Diff for: performance-tests/scaling/setup_google3.sh

+2
Original file line numberDiff line numberDiff line change
@@ -10,13 +10,15 @@ set -o nounset
1010
case "$DB_TYPE" in
1111
"alloy")
1212
ALLOY_INSTANCE="projects/fhir-analytics-test/locations/us-central1/clusters/pipeline-scaling-alloydb-1/instances/pipeline-scaling-alloydb-largest"
13+
sudo killall alloydb-auth-proxy || true
1314
# Start the AlloyDB auth proxy in the background; quote the instance URI so it is always passed as a single argument.
nohup ~/Downloads/alloydb-auth-proxy "$ALLOY_INSTANCE" &
1415
if [[ "$ENABLE_UPLOAD" = true ]]; then
1516
for cmd in "DROP DATABASE IF EXISTS" "CREATE DATABASE"; do
1617
PGPASSWORD="$DB_PASSWORD" psql -h 127.0.0.1 -p 5432 -U "$DB_USERNAME" -c "$cmd $DB_PATIENTS"
1718
done
1819
else
1920
# Check DB connection.
21+
sleep 1
2022
PGPASSWORD="$DB_PASSWORD" psql -h 127.0.0.1 -p 5432 -U "$DB_USERNAME" -c "SELECT 1"
2123
fi
2224
DB_CONNECTION="jdbc:postgresql:///${DB_PATIENTS}?127.0.0.1:5432"

Diff for: performance-tests/scaling/upload_download.py

+13-6
Original file line numberDiff line numberDiff line change
@@ -45,15 +45,22 @@ def download():
4545

4646
def run_fhir_etl(parquet_dir):
4747
common_etl_args = [
48-
"--fasterCopy=true",
4948
f"--runner={FHIR_ETL_RUNNER}",
5049
f"--resourceList=Patient,Encounter,Observation",
51-
f"--outputParquetPath={parquet_dir}",
52-
# Dataflow runner:
53-
f"--region={SQL_ZONE}",
54-
f"--numWorkers={NUM_WORKERS}",
55-
"--gcpTempLocation=gs://fhir-analytics-test/dataflow_temp"
50+
f"--outputParquetPath={parquet_dir}"
5651
]
52+
if FHIR_ETL_RUNNER == "DataflowRunner":
53+
common_etl_args.extend([
54+
f"--region={SQL_ZONE}",
55+
f"--numWorkers={NUM_WORKERS}",
56+
"--gcpTempLocation=gs://fhir-analytics-test/dataflow_temp",
57+
])
58+
if FHIR_ETL_RUNNER == "FlinkRunner":
59+
common_etl_args.extend([
60+
"--parallelism=100",
61+
"--maxParallelism=100",
62+
"--fasterCopy=true",
63+
])
5764

5865
if not JDBC_MODE:
5966
# Test HAPI server readiness.

Diff for: performance-tests/scaling/variables.sh

+24-15
Original file line numberDiff line numberDiff line change
@@ -7,25 +7,34 @@ export DB_PATIENTS="patients_$PATIENTS"
77
export DIR_WITH_THIS_SCRIPT
88
DIR_WITH_THIS_SCRIPT="$( cd -- "$(dirname "$0")" >/dev/null 2>&1 && pwd -P )"
99

10-
case "$POSTGRES_DB_INSTANCE" in
11-
"pipeline-scaling-belgium")
12-
export DB_USERNAME="postgres"
13-
export DB_PASSWORD="C%_/\Rn-=fI5f$}7"
14-
export ZONE=belgium
15-
;;
16-
"pipeline-scaling-1")
17-
export DB_USERNAME="pipeline-scaling-user"
18-
export DB_PASSWORD="C%_/\Rn-=fI5f$}7"
10+
export DB_USERNAME="postgres"
11+
export DB_PASSWORD="C%_/\Rn-=fI5f$}7"
12+
13+
case "$DB_TYPE" in
14+
"alloy")
1915
export ZONE=us-central
2016
;;
21-
"pipeline-scaling-2")
22-
export DB_USERNAME="postgres"
23-
export DB_PASSWORD="C%_/\Rn-=fI5f$}7"
24-
export ZONE=us-central
17+
"postgres")
18+
case "$POSTGRES_DB_INSTANCE" in
19+
"pipeline-scaling-belgium")
20+
export ZONE=belgium
21+
;;
22+
"pipeline-scaling-1")
23+
export DB_USERNAME="pipeline-scaling-user"
24+
export ZONE=us-central
25+
;;
26+
"pipeline-scaling-2")
27+
export ZONE=us-central
28+
;;
29+
*)
30+
echo "Invalid POSTGRES_DB_INSTANCE $POSTGRES_DB_INSTANCE"
31+
exit 2
32+
;;
33+
esac
2534
;;
2635
*)
27-
echo "Invalid POSTGRES_DB_INSTANCE $POSTGRES_DB_INSTANCE"
28-
exit 2
36+
# Report the unrecognized DB_TYPE value (expanded, not the literal variable name).
echo "Invalid DB_TYPE $DB_TYPE"
37+
exit 3
2938
;;
3039
esac
3140

0 commit comments

Comments
 (0)