Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
P
Perlmutter_GPU_queue_tensorflow
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Iterations
Requirements
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Locked files
Build
Pipelines
Jobs
Pipeline schedules
Test cases
Artifacts
Deploy
Releases
Package registry
Container registry
Model registry
Operate
Environments
Terraform modules
Monitor
Incidents
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Code review analytics
Issue analytics
Insights
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
Argonne_computing
HPCOps
Examples
Perlmutter_GPU_queue_tensorflow
Commits
30109790
Commit
30109790
authored
2 years ago
by
Rui Wang
Browse files
Options
Downloads
Patches
Plain Diff
Clean up
parent
8370f743
No related branches found
No related tags found
No related merge requests found
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
.asetup.save
+0
-90
0 additions, 90 deletions
.asetup.save
sub.sh
+1
-20
1 addition, 20 deletions
sub.sh
submit.sh
+0
-31
0 additions, 31 deletions
submit.sh
with
1 addition
and
141 deletions
.asetup.save
deleted
100755 → 0
+
0
−
90
View file @
8370f743
#Release cmake
# Saved AtlasSetup ("asetup") environment snapshot; it must be *sourced* from
# bash (it uses `return` and `[[ ]]`).  It replays the environment recorded for
# Athena 23.0.3 from the master nightly 2022-07-07T2101 on
# x86_64-centos7-gcc11-opt.
#
# Outcome: exports the variables listed below, prepends ASETUP_SYSBIN to PATH,
# and stops with `return 1` if a nightly library directory is missing.
# Failures of the sourced helper scripts are reported but do not abort.

# --- Locale and basic switches --------------------------------------------
export LANG="C"
export LC_ALL="C"
export COOL_ORA_ENABLE_ADAPTIVE_OPT="Y"
export ASETUP_PRINTLEVEL="0"
export BINARY_TAG="x86_64-centos7-gcc11-opt"
export CMTCONFIG="x86_64-centos7-gcc11-opt"

# Private directory that is later put in front of PATH.  The template,
# including its hard-coded parent directory, is kept exactly as recorded.
# mktemp can fail (e.g. the parent does not exist); that case is handled
# where PATH is modified further down.
ASETUP_SYSBIN=$(mktemp -d "/tmp/elmsheus/.asetup-sysbin-XXXXXX_$$")
export ASETUP_SYSBIN

# NOTE(review): AtlasSetup is read here, but its fallback value is only
# assigned further down -- confirm callers always have it set beforehand.
# Presumably this helper defines alias_sys_exe / alias_sys_exe_envU used below.
source "${AtlasSetup}/scripts/sys_exe-alias.sh" ''

# --- make parallelism -----------------------------------------------------
# Add a load limit (-l16) unless MAKEFLAGS already carries a ' -l' option;
# with no MAKEFLAGS at all, use 16 jobs and a load limit of 16.
if [ -n "${MAKEFLAGS:+x}" ]; then
  asetup_flags=$(echo ${MAKEFLAGS} | \grep ' -l')
  if [ -z "${asetup_flags}" ]; then
    export MAKEFLAGS="${MAKEFLAGS} -l16"
  fi
else
  export MAKEFLAGS="-j16 -l16"
fi

# --- Compiler toolchain ---------------------------------------------------
source /cvmfs/sft.cern.ch/lcg/releases/gcc/11.2.0-8a51a/x86_64-centos7/setup.sh
# `\env which` resolves the binaries through PATH only, bypassing any shell
# alias or function; a compiler that is not found leaves its variable unset.
export CC=$(\env which gcc 2>/dev/null)
[[ -z ${CC} ]] && unset CC
export CXX=$(\env which g++ 2>/dev/null)
[[ -z ${CXX} ]] && unset CXX
export FC=$(\env which gfortran 2>/dev/null)
[[ -z ${FC} ]] && unset FC
export CMAKE_NO_VERBOSE="1"

# --- ATLASLocalRootBase and cmake -----------------------------------------
# Only source atlasLocalSetup.sh when `lsetup` is not already available.
if ! type lsetup >/dev/null 2>&1; then
  source "${ATLAS_LOCAL_ROOT_BASE}/user/atlasLocalSetup.sh" --quiet
fi
source "${ATLAS_LOCAL_ROOT_BASE}/packageSetups/localSetup.sh" --quiet "cmake 3.21.3"
if [ -z "${AtlasSetup:+x}" ]; then
  export AtlasSetup="/cvmfs/atlas.cern.ch/repo/ATLASLocalRootBase/x86_64/AtlasSetup/V02-00-44/AtlasSetup"
  export AtlasSetupVersion="AtlasSetup-02-00-44"
fi

# --- Conditions / database access -----------------------------------------
export FRONTIER_SERVER="(serverurl=http://atlasfrontier-local.cern.ch:8000/atlr)(serverurl=http://atlasfrontier-ai.cern.ch:8000/atlr)(serverurl=http://ccfrontier.in2p3.fr:23128/ccin2p3-AtlasFrontier)(proxyurl=http://ca-proxy-atlas.cern.ch:3128)(proxyurl=http://ca-proxy-meyrin.cern.ch:3128)(proxyurl=http://ca-proxy.cern.ch:3128)(proxyurl=http://atlasbpfrontier.cern.ch:3127)(proxyurl=http://atlasbpfrontier.fnal.gov:3127)"
export ATLAS_POOLCOND_PATH="/cvmfs/atlas-condb.cern.ch/repo/conditions"
export ATLAS_DB_AREA="/cvmfs/atlas.cern.ch/repo/sw/database"
export DBRELEASE_OVERRIDE="current"

# --- Release location -----------------------------------------------------
export SITEROOT="/cvmfs/atlas-nightlies.cern.ch/repo/sw/master_Athena_x86_64-centos7-gcc11-opt"
export AtlasBaseDir="/cvmfs/atlas-nightlies.cern.ch/repo/sw/master_Athena_x86_64-centos7-gcc11-opt/2022-07-07T2101"
export LCG_RELEASE_BASE="/cvmfs/atlas-nightlies.cern.ch/repo/sw/master_Athena_x86_64-centos7-gcc11-opt/sw/lcg/releases"
export AtlasBuildStamp="2022-07-07T2101"
export AtlasReleaseType="nightly"
export AtlasBuildBranch="master"
export AtlasProject="Athena"
export TDAQ_RELEASE_BASE="/cvmfs/atlas.cern.ch/repo/sw/tdaq"
export ATLAS_RELEASE_BASE="/cvmfs/atlas-nightlies.cern.ch/repo/sw/master_Athena_x86_64-centos7-gcc11-opt/2022-07-07T2101"
export ATLAS_RELEASEDATA="/cvmfs/atlas-nightlies.cern.ch/repo/sw/master_Athena_x86_64-centos7-gcc11-opt/atlas/offline/ReleaseData"
export AtlasArea="/cvmfs/atlas-nightlies.cern.ch/repo/sw/master_Athena_x86_64-centos7-gcc11-opt/2022-07-07T2101/Athena/23.0.3"
export G4PATH="/cvmfs/atlas-nightlies.cern.ch/repo/sw/master_Athena_x86_64-centos7-gcc11-opt/Geant4"
export AtlasVersion="23.0.3"

# Source the release's own setup script; a failure is reported, not fatal.
source /cvmfs/atlas-nightlies.cern.ch/repo/sw/master_Athena_x86_64-centos7-gcc11-opt/2022-07-07T2101/Athena/23.0.3/InstallArea/x86_64-centos7-gcc11-opt/setup.sh
asetup_status=$?
if [ ${asetup_status} -ne 0 ]; then
  \echo "AtlasSetup(ERROR): sourcing release setup script (/cvmfs/atlas-nightlies.cern.ch/repo/sw/master_Athena_x86_64-centos7-gcc11-opt/2022-07-07T2101/Athena/23.0.3/InstallArea/x86_64-centos7-gcc11-opt/setup.sh) failed"
fi
export TestArea="/afs/cern.ch/work/e/elmsheus/testarea/tensorflow-test"

# --- System-executable workarounds ----------------------------------------
alias_sys_exe emacs
# git gets a wrapper only when an LCG curl directory is on LD_LIBRARY_PATH.
# `grep -E` replaces the obsolescent `egrep`.
if printf '%s\n' "${LD_LIBRARY_PATH:-}" | \grep -E -q 'LCG_[^/:]*/curl/'; then
  alias_sys_exe_envU git
fi
# Probe whether expr works in this environment; wrap it when it does not.
if ! \expr 1 \* 1 + 1 >/dev/null 2>&1; then
  echo -e '\nMaking workaround-alias for expr on this *OLD* machine'; alias_sys_exe expr
fi

# An empty PATH element means "current directory", so only prepend
# ASETUP_SYSBIN when mktemp actually produced a directory name.
if [ -n "${ASETUP_SYSBIN}" ]; then
  export PATH="${ASETUP_SYSBIN}:${PATH}"
else
  \echo "AtlasSetup(WARNING): could not create ASETUP_SYSBIN; PATH left unchanged" >&2
fi

# Check the completeness in the nightly release
# Every LD_LIBRARY_PATH entry below AtlasBaseDir must exist.  Entries are
# split on ':' only, so whitespace or glob characters in a path are kept
# literally.  The redirection (not a pipe) keeps the loop in the current
# shell so that `return` leaves the sourced script.
while IFS= read -r -d ':' onepath; do
  if [[ ${onepath} == "${AtlasBaseDir}"* && ! -d ${onepath} ]]; then
    echo '!! FATAL !!' "${onepath}" 'does not exist'
    return 1
  fi
done < <(printf '%s:' "${LD_LIBRARY_PATH:-}")

#Release Summary as follows:
#Release base=/cvmfs/atlas-nightlies.cern.ch/repo/sw/master_Athena_x86_64-centos7-gcc11-opt/2022-07-07T2101
#Release project=Athena
#Release releaseNum=23.0.3
#Release asconfig=x86_64-centos7-gcc11-opt
# Execute user-specified epilog
source /cvmfs/atlas.cern.ch/repo/ATLASLocalRootBase/swConfig/asetup/asetupEpilog.sh
script_status=$?
if [ ${script_status} -ne 0 ]; then
  \echo "AtlasSetup(ERROR): User-specified epilog (source /cvmfs/atlas.cern.ch/repo/ATLASLocalRootBase/swConfig/asetup/asetupEpilog.sh) reported failure (error ${script_status})"
fi
This diff is collapsed.
Click to expand it.
sub.sh
+
1
−
20
View file @
30109790
...
...
@@ -10,23 +10,4 @@
#SBATCH -c 1
# to run: sbatch sub.sh
# Source run.sh into the current batch shell (the `.` builtin needs its file
# argument on the same line).
. ./run.sh # standalone
# workerID=9999
# nNode=1
# export PANDA_HOME=/global/cfs/cdirs/m2616/harvester-perlmutter
# export PANDA_QUEUE=NERSC_Perlmutter_GPU
# export HARVESTER_DIR=$PANDA_HOME # PANDA_HOME is defined in etc/sysconfig/panda_harvester
# export HARVESTER_WORKER_ID=${workerID}
# export HARVESTER_ACCESS_POINT=/pscratch/sd/r/rwang/tensorflow-test/workdir/${workerID}
# export HARVESTER_NNODE=${nNode}
# export HARVESTER_NTASKS=$((1 * ${nNode}))
# export HARVESTER_MAPTYPE=ManyToOne
# export wrapper_wrapper_file=$HARVESTER_DIR/etc/panda/wrapper-wrapper-3.sh
# echo [$SECONDS] "Copy $wrapper_wrapper_file into $HARVESTER_ACCESS_POINT"
# mkdir -p ${HARVESTER_ACCESS_POINT}
# cd ${HARVESTER_ACCESS_POINT}
# cp -v $wrapper_wrapper_file ./
# /bin/bash ./wrapper-wrapper-3.sh $PANDA_QUEUE $HARVESTER_ACCESS_POINT
# Source run.sh into the current batch shell (the `.` builtin needs its file
# argument on the same line).
. ./run.sh # standalone
\ No newline at end of file
This diff is collapsed.
Click to expand it.
submit.sh
+
0
−
31
View file @
30109790
#!/bin/bash
#prun --exec="./run.sh" --outDS user.elmsheus.gputest.0003 --outputs=out.txt --site ANALY_MANC_GPU_TEST --disableAutoRetry --architecture nvidia-gpu --noBuild --container centos7
#prun --exec="./run.sh" --outDS user.elmsheus.tensorflow.0032 --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --site GOOGLE_GPU --cmtConfig="centos7"
#prun --exec="./run.sh" --outDS user.elmsheus.tensorflow.0109 --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --cmtConfig="centos7" --site ANALY_OU_OSCER_GPU_TEST
#prun --exec="./run.sh" --outDS user.elmsheus.tensorflow.0300 --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --cmtConfig="centos7" --site ANALY_BNL_GPU_ARC
#prun --exec="./run.sh" --outDS user.elmsheus.tensorflow.0301 --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --cmtConfig="centos7" --site ANALY_INFN-T1_GPU
#prun --exec="./run.sh" --outDS user.elmsheus.tensorflow.0302 --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --cmtConfig="centos7" --site ANALY_MANC_GPU
#prun --exec="./run.sh" --outDS user.elmsheus.tensorflow.0303 --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --cmtConfig="centos7" --site ANALY_MWT2_GPU
#prun --exec="./run.sh" --outDS user.elmsheus.tensorflow.0304 --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --cmtConfig="centos7" --site ANALY_OU_OSCER_GPU_TEST
#prun --exec="./run.sh" --outDS user.elmsheus.tensorflow.0305 --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --cmtConfig="centos7" --site ANALY_QMUL_GPU
#prun --exec="./run.sh" --outDS user.elmsheus.tensorflow.0306 --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --cmtConfig="centos7" --site ANALY_SLAC_GPU
#prun --exec="./run.sh" --outDS user.elmsheus.tensorflow.0307 --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --cmtConfig="centos7" --site DESY-HH_GPU
# prun --exec="./run.sh" --outDS user.rwang.tensorflow.`uuidgen` --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --cmtConfig="centos7" --site NERSC_Perlmutter_GPU --nCore=1 --voms atlas:/atlas/Role=production
# prun --exec=". ./run.sh" --outDS user.rwang.tensorflow.`uuidgen` --disableAutoRetry --noBuild --extFile=run.sh,testtf.py --cmtConfig="centos7" --site NERSC_Perlmutter_GPU --nCore=2 --destSE MWT2_DATADISK
## single node ##
# Single-node submission: runs ./run.sh on one file of the hc_test input
# dataset at NERSC_Perlmutter_GPU_Test and retrieves my_model.h5.
# The output dataset name is made unique per submission with uuidgen.
# The --extFile wildcards are quoted so the local shell never expands them.
prun \
  --exec="./run.sh" \
  --inDS hc_test:mc15_13TeV.361106.PowhegPythia8EvtGen_AZNLOCTEQ6L1_Zee.evgen.EVNT.e3601_tid04972714_00 \
  --nFiles 1 \
  --outDS "user.${USER}.tensorflow.$(uuidgen)" \
  --outputs my_model.h5 \
  --disableAutoRetry \
  --noBuild \
  --extFile='*.log,*.h5,prmon*' \
  --site NERSC_Perlmutter_GPU_Test \
  --nCore=4 \
  --architecture nvidia
# --prodSourceLabel test
## multi node ##
# aprun -n 2 -d 8 --exec="./run.sh" --outDS user.rwang.tensorflow.`uuidgen` --outputs my_model.h5 --disableAutoRetry --noBuild --extFile=*.log,*.h5,prmon* --site NERSC_Perlmutter_GPU_Test --nCore=7 --architecture nvidia #
#ANALY_BNL_GPU_ARC : test
#ANALY_INFN-T1_GPU : brokeroff
#ANALY_MANC_GPU : online
...
...
@@ -30,13 +9,3 @@ prun --exec="./run.sh" --inDS hc_test:mc15_13TeV.361106.PowhegPythia8EvtGen_AZNL
#ANALY_QMUL_GPU : test
#ANALY_SLAC_GPU : online
#GOOGLE_GPU : offline
# --cmtConfig="centos7"
# --architecture "&nvidia-gpu"
# ANALY_MANC_GPU
# GOOGLE_GPU
#--cmtConfig nvidia-gpu@centos7
#--cmtConfig nvidia-gpu
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment