From 6d0c2de3996062be45a0911a4431e013321b1bbe Mon Sep 17 00:00:00 2001 From: Peter Boyle Date: Tue, 3 Oct 2023 17:04:20 +0000 Subject: [PATCH] Deprecate the PVC directory and make a PVC-OEM generic PVC target with no queueing system dependency -- just interactive scripts --- systems/{OEM => PVC-OEM}/README | 0 systems/{OEM => PVC-OEM}/benchmarks/bench.sh | 0 .../{OEM => PVC-OEM}/benchmarks/select_gpu.sh | 0 systems/{OEM => PVC-OEM}/config-command | 0 systems/{OEM => PVC-OEM}/setup.sh | 0 systems/PVC/benchmarks/run-1tile.sh | 62 ------------------- systems/PVC/benchmarks/run-2tile-mpi.sh | 33 ---------- systems/PVC/benchmarks/wrap.sh | 9 --- systems/PVC/config-command | 16 ----- systems/PVC/setup.sh | 18 ------ 10 files changed, 138 deletions(-) rename systems/{OEM => PVC-OEM}/README (100%) rename systems/{OEM => PVC-OEM}/benchmarks/bench.sh (100%) rename systems/{OEM => PVC-OEM}/benchmarks/select_gpu.sh (100%) rename systems/{OEM => PVC-OEM}/config-command (100%) rename systems/{OEM => PVC-OEM}/setup.sh (100%) delete mode 100755 systems/PVC/benchmarks/run-1tile.sh delete mode 100755 systems/PVC/benchmarks/run-2tile-mpi.sh delete mode 100755 systems/PVC/benchmarks/wrap.sh delete mode 100644 systems/PVC/config-command delete mode 100644 systems/PVC/setup.sh diff --git a/systems/OEM/README b/systems/PVC-OEM/README similarity index 100% rename from systems/OEM/README rename to systems/PVC-OEM/README diff --git a/systems/OEM/benchmarks/bench.sh b/systems/PVC-OEM/benchmarks/bench.sh similarity index 100% rename from systems/OEM/benchmarks/bench.sh rename to systems/PVC-OEM/benchmarks/bench.sh diff --git a/systems/OEM/benchmarks/select_gpu.sh b/systems/PVC-OEM/benchmarks/select_gpu.sh similarity index 100% rename from systems/OEM/benchmarks/select_gpu.sh rename to systems/PVC-OEM/benchmarks/select_gpu.sh diff --git a/systems/OEM/config-command b/systems/PVC-OEM/config-command similarity index 100% rename from systems/OEM/config-command rename to 
systems/PVC-OEM/config-command diff --git a/systems/OEM/setup.sh b/systems/PVC-OEM/setup.sh similarity index 100% rename from systems/OEM/setup.sh rename to systems/PVC-OEM/setup.sh diff --git a/systems/PVC/benchmarks/run-1tile.sh b/systems/PVC/benchmarks/run-1tile.sh deleted file mode 100755 index 9a29b773..00000000 --- a/systems/PVC/benchmarks/run-1tile.sh +++ /dev/null @@ -1,62 +0,0 @@ -#!/bin/sh -##SBATCH -p PVC-SPR-QZEH -##SBATCH -p PVC-ICX-QZNW -#SBATCH -p QZ1J-ICX-PVC -##SBATCH -p QZ1J-SPR-PVC-2C - -#source /nfs/site/home/paboylex/ATS/GridNew/Grid/systems/PVC-nightly/setup.sh - -export NT=8 - -export I_MPI_OFFLOAD=1 -export I_MPI_OFFLOAD_TOPOLIB=level_zero -export I_MPI_OFFLOAD_DOMAIN_SIZE=-1 - -# export IGC_EnableLSCFenceUGMBeforeEOT=0 -# export SYCL_PROGRAM_COMPILE_OPTIONS="-ze-opt-large-register-file=False" -export SYCL_DEVICE_FILTER=gpu,level_zero -#export IGC_ShaderDumpEnable=1 -#export IGC_DumpToCurrentDir=1 -export I_MPI_OFFLOAD_CELL=tile -export EnableImplicitScaling=0 -export EnableWalkerPartition=0 -export ZE_AFFINITY_MASK=0.0 -mpiexec -launcher ssh -n 1 -host localhost ./Benchmark_dwf_fp32 --mpi 1.1.1.1 --grid 32.32.32.32 --accelerator-threads $NT --comms-sequential --shm-mpi 1 --device-mem 32768 - -export ZE_AFFINITY_MASK=0 -export I_MPI_OFFLOAD_CELL=device -export EnableImplicitScaling=1 -export EnableWalkerPartition=1 - - - - - - - - - - - - - - - - - - - - -#mpiexec -launcher ssh -n 2 -host localhost vtune -collect gpu-hotspots -knob gpu-sampling-interval=1 -data-limit=0 -r ./vtune_run4 -- ./wrap.sh ./Benchmark_dwf_fp32 --mpi 2.1.1.1 --grid 64.32.32.32 --accelerator-threads $NT --comms-overlap --shm-mpi 1 - -#mpiexec -launcher ssh -n 1 -host localhost ./wrap.sh ./Benchmark_dwf_fp32 --mpi 1.1.1.1 --grid 64.32.32.32 --accelerator-threads $NT --comms-overlap --shm-mpi 1 - -#mpiexec -launcher ssh -n 2 -host localhost ./wrap.sh ./Benchmark_dwf_fp32 --mpi 2.1.1.1 --grid 64.32.32.32 --accelerator-threads $NT --comms-sequential --shm-mpi 1 - -#mpiexec 
-launcher ssh -n 2 -host localhost ./wrap.sh ./Benchmark_dwf_fp32 --mpi 2.1.1.1 --grid 64.32.32.32 --accelerator-threads $NT --comms-overlap --shm-mpi 1 - -#mpiexec -launcher ssh -n 2 -host localhost ./wrap.sh ./Benchmark_dwf_fp32 --mpi 2.1.1.1 --grid 64.32.32.32 --accelerator-threads $NT --comms-sequential --shm-mpi 0 - -#mpirun -np 2 ./wrap.sh ./Benchmark_dwf_fp32 --mpi 1.1.1.2 --grid 16.32.32.64 --accelerator-threads $NT --comms-sequential --shm-mpi 0 -#mpirun -np 2 ./wrap.sh ./Benchmark_dwf_fp32 --mpi 1.1.1.2 --grid 32.32.32.64 --accelerator-threads $NT --comms-sequential --shm-mpi 1 - diff --git a/systems/PVC/benchmarks/run-2tile-mpi.sh b/systems/PVC/benchmarks/run-2tile-mpi.sh deleted file mode 100755 index 1db67508..00000000 --- a/systems/PVC/benchmarks/run-2tile-mpi.sh +++ /dev/null @@ -1,33 +0,0 @@ -#!/bin/bash -##SBATCH -p PVC-SPR-QZEH -##SBATCH -p PVC-ICX-QZNW - -#SBATCH -p QZ1J-ICX-PVC - -#source /nfs/site/home/paboylex/ATS/GridNew/Grid/systems/PVC-nightly/setup.sh - -export NT=16 - -# export IGC_EnableLSCFenceUGMBeforeEOT=0 -# export SYCL_PROGRAM_COMPILE_OPTIONS="-ze-opt-large-register-file=False" -#export IGC_ShaderDumpEnable=1 -#export IGC_DumpToCurrentDir=1 -export I_MPI_OFFLOAD=1 -export I_MPI_OFFLOAD_TOPOLIB=level_zero -export I_MPI_OFFLOAD_DOMAIN_SIZE=-1 -export SYCL_DEVICE_FILTER=gpu,level_zero -export I_MPI_OFFLOAD_CELL=tile -export EnableImplicitScaling=0 -export EnableWalkerPartition=0 -#export SYCL_PI_LEVEL_ZERO_DEVICE_SCOPE_EVENTS=1 -#export SYCL_PI_LEVEL_ZERO_USE_IMMEDIATE_COMMANDLISTS=1 -export SYCL_PI_LEVEL_ZERO_USE_COPY_ENGINE=0 - -for i in 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 -do -mpiexec -launcher ssh -n 2 -host localhost ./wrap.sh ./Benchmark_dwf_fp32 --mpi 1.1.1.2 --grid 32.32.32.64 --accelerator-threads $NT --shm-mpi 0 --device-mem 32768 > 1.1.1.2.log$i -mpiexec -launcher ssh -n 2 -host localhost ./wrap.sh ./Benchmark_dwf_fp32 --mpi 2.1.1.1 --grid 64.32.32.32 --accelerator-threads $NT --shm-mpi 0 --device-mem 32768 
> 2.1.1.1.log$i -done - -mpiexec -launcher ssh -n 2 -host localhost ./wrap.sh ./Benchmark_dwf_fp32 --mpi 2.1.1.1 --grid 64.32.32.32 --accelerator-threads $NT --comms-sequential --shm-mpi 0 - diff --git a/systems/PVC/benchmarks/wrap.sh b/systems/PVC/benchmarks/wrap.sh deleted file mode 100755 index b8806b30..00000000 --- a/systems/PVC/benchmarks/wrap.sh +++ /dev/null @@ -1,9 +0,0 @@ -#!/bin/sh - -export ZE_AFFINITY_MASK=0.$MPI_LOCALRANKID - -echo Ranke $MPI_LOCALRANKID ZE_AFFINITY_MASK is $ZE_AFFINITY_MASK - - - $@ - diff --git a/systems/PVC/config-command b/systems/PVC/config-command deleted file mode 100644 index c3523c2d..00000000 --- a/systems/PVC/config-command +++ /dev/null @@ -1,16 +0,0 @@ -INSTALL=/nfs/site/home/paboylx/prereqs/ -../../configure \ - --enable-simd=GPU \ - --enable-gen-simd-width=64 \ - --enable-comms=mpi-auto \ - --disable-accelerator-cshift \ - --disable-gparity \ - --disable-fermion-reps \ - --enable-shm=nvlink \ - --enable-accelerator=sycl \ - --enable-unified=no \ - MPICXX=mpicxx \ - CXX=dpcpp \ - LDFLAGS="-fsycl-device-code-split=per_kernel -fsycl-device-lib=all -lze_loader -L$INSTALL/lib" \ - CXXFLAGS="-fsycl-unnamed-lambda -fsycl -no-fma -I$INSTALL/include -Wno-tautological-compare" - diff --git a/systems/PVC/setup.sh b/systems/PVC/setup.sh deleted file mode 100644 index c3b97ce0..00000000 --- a/systems/PVC/setup.sh +++ /dev/null @@ -1,18 +0,0 @@ -export https_proxy=http://proxy-chain.intel.com:911 -#export LD_LIBRARY_PATH=/nfs/site/home/azusayax/install/lib:$LD_LIBRARY_PATH -export LD_LIBRARY_PATH=$HOME/prereqs/lib/:$LD_LIBRARY_PATH - -module load intel-release -module load intel-comp-rt/embargo-ci-neo - -#source /opt/intel/oneapi/PVC_setup.sh -#source /opt/intel/oneapi/ATS_setup.sh -#module load intel-nightly/20230331 -#module load intel-comp-rt/ci-neo-master/026093 - -#module load intel/mpich -module load intel/mpich/pvc45.3 -export PATH=~/ATS/pti-gpu/tools/onetrace/:$PATH - -#clsh embargo-ci-neo-022845 -#source 
/opt/intel/vtune_amplifier/amplxe-vars.sh