#!/bin/bash
#
# gpu_tile.sh -- per-rank launch wrapper: pick a GPU and a NUMA node from the
# node-local rank, export the runtime settings below, then run the given
# command under numactl.
#
# Usage:  gpu_tile.sh <command> [args...]
#
# Environment read:
#   PALS_LOCAL_RANKID  node-local rank; index into the tables below
#                      (falls back to 0 when unset or empty)
#   PALS_RANKID        global rank; logged, and selects the rank-0 branch
#
# Provenance: recovered from a git patch adding
#   systems/Aurora/benchmarks/gpu_tile.sh (new file, mode 100755)
#   commit 1caf8b0f868e36f2405648efd51c1ddcffe1ae1b
#   From: Peter Boyle, Tue, 28 Jan 2025 15:22:37 +0000, Subject: [PATCH] Rename

# Earlier mappings, kept for reference:
#export NUMA_MAP=(2 2 2 3 3 3 2 2 2 3 3 3 )
#export NUMA_MAP=(0 0 1 1 0 0 1 1 0 0 1 1);
#export GPU_MAP=(0.0 0.1 3.0 3.1 1.0 1.1 4.0 4.1 2.0 2.1 5.0 5.1)

# Lookup tables indexed by node-local rank. They are plain shell arrays: bash
# cannot pass arrays to child processes through the environment, so marking
# them for export would have no effect.
NUMA_PMAP=(0 0 0 1 1 1 0 0 0 1 1 1)
# NOTE(review): NUMA_MMAP is not consulted anywhere below (NUMAM is taken from
# NUMA_PMAP), and it has 14 entries where the other tables have 12. Confirm
# which memory binding is intended before wiring it in.
NUMA_MMAP=(2 2 2 3 3 3 3 2 2 2 2 3 3 3)
# Entries are used verbatim as ZE_AFFINITY_MASK values
# (presumably <device>.<sub-device> -- confirm against the Level Zero docs).
GPU_MAP=(0.0 1.0 2.0 3.0 4.0 5.0 0.1 1.1 2.1 3.1 4.1 5.1)

local_rank=${PALS_LOCAL_RANKID:-0}

export NUMAP=${NUMA_PMAP[$local_rank]}
export NUMAM=${NUMA_PMAP[$local_rank]}
export gpu_id=${GPU_MAP[$local_rank]}

# A local rank past the end of the tables would yield an empty affinity mask
# and a malformed numactl command line; stop with a clear message instead.
if [[ -z "$gpu_id" || -z "$NUMAP" ]]; then
  echo "gpu_tile.sh: no GPU/NUMA mapping for local rank $local_rank" >&2
  exit 1
fi

unset EnableWalkerPartition
export EnableImplicitScaling=0
export ZE_AFFINITY_MASK=$gpu_id
export ONEAPI_DEVICE_FILTER=gpu,level_zero

# SYCL Level Zero plugin settings.
export SYCL_PI_LEVEL_ZERO_DEVICE_SCOPE_EVENTS=0
export SYCL_PI_LEVEL_ZERO_USE_IMMEDIATE_COMMANDLISTS=1
export SYCL_PI_LEVEL_ZERO_USE_COPY_ENGINE=0:5
export SYCL_PI_LEVEL_ZERO_USE_COPY_ENGINE_FOR_D2D_COPY=1
#export SYCL_PI_LEVEL_ZERO_USE_COPY_ENGINE=0:2
#export SYCL_PI_LEVEL_ZERO_USM_RESIDENT=1

# Report the binding actually applied (CPU node and memory node).
echo "rank $PALS_RANKID ; local rank $local_rank ; ZE_AFFINITY_MASK=$ZE_AFFINITY_MASK ; NUMA cpu $NUMAP mem $NUMAM "

# Both branches currently run the same command. The split is kept so that
# rank 0 alone can be wrapped in a profiler by swapping in the commented line.
if [[ "${PALS_RANKID:-}" == "0" ]]; then
  # numactl -m "$NUMAM" -N "$NUMAP" unitrace --chrome-kernel-logging --chrome-mpi-logging --chrome-sycl-logging --demangle "$@"
  numactl -m "$NUMAM" -N "$NUMAP" "$@"
else
  numactl -m "$NUMAM" -N "$NUMAP" "$@"
fi