Skip to content

Commit fe8ee3b

Browse files
committed
Merge branch 'spark2a-template' into 'main'
Update to spark2a templates. Closes #2 and #1. See merge request nvspark/nds!5.
2 parents deafb01 + f12e50a commit fe8ee3b

File tree

2 files changed

+59
-24
lines changed

2 files changed

+59
-24
lines changed

power_run_cpu.template

Lines changed: 34 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,34 @@
1+
#
2+
# SPDX-FileCopyrightText: Copyright (c) 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
3+
# SPDX-License-Identifier: Apache-2.0
4+
#
5+
# Licensed under the Apache License, Version 2.0 (the "License");
6+
# you may not use this file except in compliance with the License.
7+
# You may obtain a copy of the License at
8+
#
9+
# http://www.apache.org/licenses/LICENSE-2.0
10+
#
11+
# Unless required by applicable law or agreed to in writing, software
12+
# distributed under the License is distributed on an "AS IS" BASIS,
13+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14+
# See the License for the specific language governing permissions and
15+
# limitations under the License.
16+
#
17+
export CUDF_JAR=cudf-22.02.0.jar
18+
export SPARK_RAPIDS_PLUGIN_JAR=rapids-4-spark_2.12-22.02.0.jar
19+
export SPARK_HOME=/usr/lib/spark
20+
$SPARK_HOME/bin/spark-shell \
21+
--master yarn \
22+
--conf spark.rapids.sql.enabled=false \
23+
--conf spark.executor.cores=16 \
24+
--conf spark.executor.memory=16G \
25+
--conf spark.driver.memory=50G \
26+
--conf spark.sql.adaptive.enabled=true \
27+
--conf spark.locality.wait=0 \
28+
--conf spark.sql.shuffle.partitions=128 \
29+
--conf spark.executor.instances=8 \
30+
--conf spark.dynamicAllocation.enabled=false \
31+
--conf spark.scheduler.mode=FIFO \
32+
--conf spark.sql.autoBroadcastJoinThreshold=10m \
33+
--conf spark.scheduler.minRegisteredResourcesRatio=1.0 \
34+
--conf spark.sql.broadcastTimeout=1200 \

power_run_gpu.template

Lines changed: 25 additions & 24 deletions
Original file line number | Diff line number | Diff line change
@@ -16,28 +16,29 @@
1616
#
1717
export CUDF_JAR=cudf-22.02.0.jar
1818
export SPARK_RAPIDS_PLUGIN_JAR=rapids-4-spark_2.12-22.02.0.jar
19-
export SPARK_HOME=YOUR_SPARK_HOME
19+
export SPARK_HOME=/usr/lib/spark
2020
$SPARK_HOME/bin/spark-shell \
21-
--master YOUR_SPARK_MASTER \
22-
--driver-memory 10G \
23-
--num-executors 1 \
24-
--executor-memory 40G \
25-
--executor-cores 12 \
26-
--conf spark.task.cpus=1 \
27-
--conf spark.task.resource.gpu.amount=0.05 \
28-
--conf spark.rapids.sql.concurrentGpuTasks=2 \
29-
--conf spark.plugins=com.nvidia.spark.SQLPlugin \
30-
--conf spark.sql.files.maxPartitionBytes=2g \
31-
--conf spark.rapids.memory.pinnedPool.size=8g \
32-
--conf spark.rapids.sql.explain=NOT_ON_GPU \
33-
--conf spark.rapids.sql.incompatibleOps.enabled=true \
34-
--conf spark.rapids.sql.variableFloatAgg.enabled=true \
35-
--conf spark.rapids.sql.csv.read.date.enabled=true \
36-
--conf spark.rapids.sql.csvTimestamps.enabled=false \
37-
--conf spark.rapids.sql.csv.read.integer.enabled=true \
38-
--conf spark.sql.legacy.parquet.datetimeRebaseModeInWrite=CORRECTED \
39-
--conf spark.rapids.sql.castFloatToDecimal.enabled=true \
40-
--conf spark.executor.resource.gpu.amount=1 \
41-
--conf spark.executor.resource.gpu.discoveryScript=./getGpusResources.sh \
42-
--files $SPARK_HOME/examples/src/main/scripts/getGpusResources.sh \
43-
--jars $SPARK_RAPIDS_PLUGIN_JAR,$CUDF_JAR \
21+
--master yarn \
22+
--conf spark.rapids.memory.gpu.pool=ARENA \
23+
--conf spark.rapids.sql.batchSizeBytes=1GB \
24+
--conf spark.driver.maxResultSize=2GB \
25+
--conf spark.executor.instances=8 \
26+
--conf spark.executor.cores=16 \
27+
--conf spark.locality.wait=0 \
28+
--conf spark.rapids.sql.concurrentGpuTasks=2 \
29+
--conf spark.executor.resource.gpu.amount=1 \
30+
--conf spark.task.resource.gpu.amount=0.0625 \
31+
--conf spark.executor.memory=16G \
32+
--conf spark.driver.memory=50G \
33+
--conf spark.sql.shuffle.partitions=200 \
34+
--conf spark.sql.files.maxPartitionBytes=2gb \
35+
--conf spark.driver.extraClassPath=$SPARK_RAPIDS_PLUGIN_JAR:$CUDF_JAR \
36+
--conf spark.executor.extraClassPath=$SPARK_RAPIDS_PLUGIN_JAR:$CUDF_JAR \
37+
--conf spark.executor.extraJavaOptions=-Dai.rapids.cudf.nvtx.enabled=true \
38+
--conf spark.rapids.memory.host.spillStorageSize=32G \
39+
--conf spark.sql.adaptive.enabled=true \
40+
--conf spark.plugins=com.nvidia.spark.SQLPlugin \
41+
--conf spark.rapids.memory.pinnedPool.size=8g \
42+
--conf spark.rapids.shuffle.maxMetadataSize=512KB \
43+
--conf spark.executor.resource.gpu.discoveryScript=./getGpusResources.sh \
44+
--files $SPARK_HOME/examples/src/main/scripts/getGpusResources.sh \

0 commit comments

Comments (0)