Purpose:
- To check whether the InfiniBand (IB) interface on the HPC compute nodes (H/HB/HC) is showing as up
- chk_ib.py: Hook to check if eth1 is up on IB-enabled H16r(m) or NV24r nodes
qmgr commands
/opt/pbs/bin/qmgr -c "create hook chk_ib"
/opt/pbs/bin/qmgr -c "set hook chk_ib event=exechost_startup"
/opt/pbs/bin/qmgr -c "import hook chk_ib application/x-python default chk_ib.py"
Purpose:
- To create a job dir on the local SSD that the user can use on each node assigned to the job
- setup_jobdir.py
qmgr commands
create hook setup_jobdir
set hook setup_jobdir event="execjob_begin,execjob_end"
import hook setup_jobdir application/x-python default setup_jobdir.py
Purpose:
- To reduce jitter on the compute nodes when jobs are running
- stop_waagent.py
qmgr commands
create hook stop_wa
set hook stop_wa event="execjob_begin,execjob_end"
import hook stop_wa application/x-python default stop_waagent.py
Purpose:
- To delete all of the user processes on the nodes once the job has completed
- pbs_user_proc_cleanup.py (NOTE: the import command below references pbs_user_cleanup.py; confirm which filename is correct)
qmgr commands
create hook user_cleanup
set hook user_cleanup event="execjob_end"
import hook user_cleanup application/x-python default pbs_user_cleanup.py
Purpose:
- To check the memory stream performance of the node when it boots up
- Refer to the pbsserverhooks.sh script
sudo /opt/pbs/bin/qmgr -c 'create hook nhc_run_stream'
sudo /opt/pbs/bin/qmgr -c 'set hook nhc_run_stream event="exechost_startup"'
sudo /opt/pbs/bin/qmgr -c "import hook nhc_run_stream application/x-python default $HOOKS_DIR/nhc_run_stream.py"